0% found this document useful (0 votes)

10K views7 pages

Coe Projects

This document contains code snippets for various predictive analytics and machine learning tasks, including sales forecasting using linear regression, sentiment analysis on social media data, disease prediction using random forest classification on healthcare data, recommendation systems for e-commerce using collaborative filtering, text classification for sentiment analysis using naive bayes, and time series analysis for stock price prediction using random forest regression. The code includes data loading, preprocessing, model training, evaluation, and visualization steps.

Uploaded by

tApIsH

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

10K views7 pages

Coe Projects

Uploaded by

tApIsH

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 7

coe-projects

February 8, 2024

[ ]: # Predictive Analytics for Sales Forecasting

import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error
import matplotlib.pyplot as plt

# Load the sales data and preview the first rows.
sales_data = pd.read_csv('data.csv')
print(sales_data.head())

# Predictor columns. These are placeholder names: replace them with the real
# column names of the dataset. (The list previously also held a literal '...'
# entry, which pandas would look up as a column name and fail on unless the
# CSV really has a column called '...'.)
feature_columns = ['Feature1', 'Feature2']
features = sales_data[feature_columns]
target = sales_data['Sales']

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split
# reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(
    features, target, test_size=0.2, random_state=42
)

# Fit a linear regression model on the training split.
model = LinearRegression()
model.fit(X_train, y_train)

# Predict on the held-out rows and report the mean squared error.
predictions = model.predict(X_test)
mse = mean_squared_error(y_test, predictions)
print(f'Mean Squared Error: {mse}')

# Visualise actual vs. predicted sales against ONE feature.
# plt.scatter needs x and y of the same size, so the whole multi-column
# X_test frame cannot be used as the x axis.
plot_feature = feature_columns[0]
plt.scatter(X_test[plot_feature], y_test, color='blue', label='Actual Sales')
plt.scatter(X_test[plot_feature], predictions, color='red', label='Predicted Sales')
plt.xlabel(plot_feature)
plt.ylabel('Sales')
plt.legend()
plt.show()

1
[ ]: #sentiment analysis on social media data

from textblob import TextBlob

# Sample social media comments/reviews
comments = [
    "I love this product! It's amazing!",
    "The service was terrible, never using it again.",
    "I'm not sure about this brand, needs improvement.",
    "Best experience ever, highly recommend!",
]

# Classify each comment by the sign of its TextBlob polarity score:
# above zero is positive, below zero is negative, exactly zero is neutral.
for comment in comments:
    polarity = TextBlob(comment).sentiment.polarity
    if polarity > 0:
        label = "Positive"
    elif polarity < 0:
        label = "Negative"
    else:
        label = "Neutral"
    print(f"'{comment}' - {label}")

'I love this product! It's amazing!' - Positive

'The service was terrible, never using it again.' - Negative
'I'm not sure about this brand, needs improvement.' - Negative
'Best experience ever, highly recommend!' - Positive

[ ]: # Healthcare analytics: disease prediction

# important libraries
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# libraries for modeling & prediction

from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, classification_report
from sklearn.impute import SimpleImputer

# Load the health records and preview the first rows.
health_data = pd.read_csv('data.csv')
print(health_data.head())

# Predictor columns. These are placeholder names: replace them with the real
# column names of the dataset. (A literal '...' entry is not a column name.)
feature_columns = ['Feature1', 'Feature2']

# A row without a label cannot be used for supervised learning. Dropping it is
# safer than mean-imputing the label, which would turn class labels into
# arbitrary fractional values.
health_data = health_data.dropna(subset=['Disease'])
features = health_data[feature_columns]
target = health_data['Disease']

# Split data into train and test sets (20% held out, reproducible seed).
X_train, X_test, y_train, y_test = train_test_split(
    features, target, test_size=0.2, random_state=42
)

# Handle missing feature values with mean imputation. The imputer is fitted on
# the training split only, so statistics of the test rows do not leak into
# training; the test split is transformed with the training means.
imputer = SimpleImputer(strategy='mean')
X_train = pd.DataFrame(
    imputer.fit_transform(X_train), columns=feature_columns, index=X_train.index
)
X_test = pd.DataFrame(
    imputer.transform(X_test), columns=feature_columns, index=X_test.index
)

# Train a random forest classifier and predict the held-out rows.
model = RandomForestClassifier(n_estimators=100, random_state=42)
model.fit(X_train, y_train)
predictions = model.predict(X_test)

# Evaluate the predictions.
accuracy = accuracy_score(y_test, predictions)
print(f'Accuracy: {accuracy}')
print('Classification Report:\n', classification_report(y_test, predictions))

# Visualise predicted vs. actual class counts side by side. Two separate
# countplot calls on the same axes draw their bars on top of each other, so the
# values are stacked into one long-format frame and separated with `hue`.
comparison = pd.DataFrame({
    'Disease': list(y_test) + list(predictions),
    'Source': ['Actual'] * len(y_test) + ['Predicted'] * len(predictions),
})
plt.figure(figsize=(8, 6))
# seaborn adds the legend for `hue` itself, so no explicit plt.legend() call.
sns.countplot(data=comparison, x='Disease', hue='Source', palette='Set2')
plt.xlabel('Disease')
plt.ylabel('Count')
plt.title('Disease Prediction: Predicted vs. Actual')
plt.show()

[ ]: # recommendation system for e-commerce

from surprise import Dataset, Reader, KNNBasic

from surprise.model_selection import train_test_split
from surprise.accuracy import rmse

# Load ratings from a comma-separated file whose lines are
# "user,item,rating", with ratings on a 1-5 scale.
reader = Reader(line_format='user item rating', sep=',', rating_scale=(1, 5))
data = Dataset.load_from_file('data.csv', reader=reader)

# Split data into train and test sets (fixed seed for a reproducible split).
trainset, testset = train_test_split(data, test_size=0.2, random_state=42)

# Build and train a user-based k-NN model with cosine similarity.
sim_options = {'name': 'cosine', 'user_based': True}
model = KNNBasic(sim_options=sim_options)
model.fit(trainset)

# Evaluate the model; rmse() prints the score.
predictions = model.test(testset)
rmse(predictions)

# Make recommendations for a user.
# Surprise keeps its own "inner" ids, which differ from the raw ids in the
# file, so the raw id must be translated with to_inner_uid() rather than cast
# with int(). get_neighbors() would only return similar *users*; to recommend
# *items*, every item the user has not rated yet is scored and the highest
# estimated ratings are kept.
user_id = '123'
top_n = 10
recommendations = []
try:
    inner_uid = trainset.to_inner_uid(user_id)
except ValueError:
    # The user has no ratings in the training split.
    print(f"User {user_id!r} is not in the training set")
else:
    items_to_ignore = {inner_iid for inner_iid, _ in trainset.ur[inner_uid]}
    scored = []
    for inner_iid in trainset.all_items():
        if inner_iid in items_to_ignore:
            continue
        raw_iid = trainset.to_raw_iid(inner_iid)
        # predict() takes raw ids and returns a Prediction; .est is the
        # estimated rating.
        scored.append((raw_iid, model.predict(user_id, raw_iid).est))
    scored.sort(key=lambda pair: pair[1], reverse=True)
    recommendations = scored[:top_n]
    print(recommendations)

[1]: # natural language processing for text classification

import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.naive_bayes import MultinomialNB
from sklearn.metrics import accuracy_score, classification_report

# Sample data - replace with your own dataset.
# NOTE: with only five documents the 20% test split holds a single sample, so
# the reported metrics are illustrative only.
documents = [
    ("This product is great", "positive"),
    ("The service was terrible", "negative"),
    ("The delivery was fast", "positive"),
    ("I'm never buying from them again", "negative"),
    ("Worst experience ever", "negative"),
]

# Split data into features (texts) and labels.
X = [text for text, _ in documents]
y = [label for _, label in documents]

# Split data into training and testing sets.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

# Feature extraction using TF-IDF vectorization. The vocabulary is learned
# from the training texts only and then reused for the test texts.
vectorizer = TfidfVectorizer()
X_train_vec = vectorizer.fit_transform(X_train)
X_test_vec = vectorizer.transform(X_test)

# Build and train a Multinomial Naive Bayes classifier.
classifier = MultinomialNB()
classifier.fit(X_train_vec, y_train)

# Predictions
y_pred = classifier.predict(X_test_vec)

# Evaluate the model.
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy:.2f}")

# Classification report. zero_division=0 reports 0.0 for labels that have no
# true or no predicted samples instead of emitting UndefinedMetricWarning for
# each of them.
print("\nClassification Report:")
print(classification_report(y_test, y_pred, zero_division=0))

Accuracy: 0.00

Classification Report:
precision recall f1-score support

negative 0.00 0.00 0.00 1.0

positive 0.00 0.00 0.00 0.0

accuracy 0.00 1.0

macro avg 0.00 0.00 0.00 1.0
weighted avg 0.00 0.00 0.00 1.0

/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1344:
UndefinedMetricWarning: Precision and F-score are ill-defined and being set to
0.0 in labels with no predicted samples. Use `zero_division` parameter to
control this behavior.
_warn_prf(average, modifier, msg_start, len(result))
/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1344:
UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0
in labels with no true samples. Use `zero_division` parameter to control this
behavior.
_warn_prf(average, modifier, msg_start, len(result))
/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1344:
UndefinedMetricWarning: Precision and F-score are ill-defined and being set to
0.0 in labels with no predicted samples. Use `zero_division` parameter to
control this behavior.
_warn_prf(average, modifier, msg_start, len(result))
/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1344:
UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0
in labels with no true samples. Use `zero_division` parameter to control this
behavior.
_warn_prf(average, modifier, msg_start, len(result))

5
/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1344:
UndefinedMetricWarning: Precision and F-score are ill-defined and being set to
0.0 in labels with no predicted samples. Use `zero_division` parameter to
control this behavior.
_warn_prf(average, modifier, msg_start, len(result))
/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1344:
UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0
in labels with no true samples. Use `zero_division` parameter to control this
behavior.
_warn_prf(average, modifier, msg_start, len(result))

[ ]: # time series analysis for stock price prediction

import numpy as np
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import mean_squared_error
import matplotlib.pyplot as plt

# Load historical stock price data.
# Replace 'data.csv' with your dataset file path or an API call to fetch data.
stock_data = pd.read_csv('data.csv')

# Calculate financial indicators (e.g., moving averages, RSI, MACD, etc.).
# Here a simple moving average of the closing price is used as an example.
# NOTE(review): the rolling window ends at the current row, so each SMA value
# already contains that row's own 'Close' - consider shifting it for a real
# forecast.
window = 30
stock_data['SMA'] = stock_data['Close'].rolling(window=window).mean()

# Define features and target variable.
features = ['SMA']  # Add more financial indicators as needed
target = 'Close'

# Drop rows with missing values (the first window-1 rows have no SMA).
stock_data.dropna(inplace=True)

# Split data into features and target variable.
X = stock_data[features]
y = stock_data[target]

# Split data into training and testing sets in chronological order.
# shuffle=False keeps the first 80% of rows for training and the last 20% for
# testing, so the model is never trained on rows that come after the test
# period, and the train/test predictions stay in the same order as the index,
# which the plot below relies on.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, shuffle=False
)

# Train a Random Forest regressor.
rf_regressor = RandomForestRegressor(n_estimators=100, random_state=42)
rf_regressor.fit(X_train, y_train)

# Make predictions.
y_pred_train = rf_regressor.predict(X_train)
y_pred_test = rf_regressor.predict(X_test)

# Evaluate the model.
train_rmse = np.sqrt(mean_squared_error(y_train, y_pred_train))
test_rmse = np.sqrt(mean_squared_error(y_test, y_pred_test))
print(f"Train RMSE: {train_rmse:.2f}")
print(f"Test RMSE: {test_rmse:.2f}")

# Plot actual vs. predicted prices. Train predictions followed by test
# predictions line up with stock_data.index only because the split above is
# not shuffled.
plt.figure(figsize=(10, 6))
plt.plot(stock_data.index, stock_data['Close'], label='Actual Price')
plt.plot(
    stock_data.index,
    np.concatenate((y_pred_train, y_pred_test)),
    label='Predicted Price',
)
plt.title('Stock Price Prediction')
plt.xlabel('Date')
plt.ylabel('Price')
plt.legend()
plt.show()

Toshiba - E7239X Datasheet
50% (2)
Toshiba - E7239X Datasheet
16 pages
ML External Xerox
No ratings yet
ML External Xerox
1 page
Predictive Modeling Machine Learning
No ratings yet
Predictive Modeling Machine Learning
16 pages
AI
No ratings yet
AI
16 pages
Decision Tree
No ratings yet
Decision Tree
6 pages
AI ML - Cycle 2 Programs
No ratings yet
AI ML - Cycle 2 Programs
15 pages
16BCB0126 VL2018195002535 Pe003
No ratings yet
16BCB0126 VL2018195002535 Pe003
40 pages
ML PDF
No ratings yet
ML PDF
30 pages
ML Internal Answers
No ratings yet
ML Internal Answers
9 pages
Unit2 ML Programs
No ratings yet
Unit2 ML Programs
7 pages
ML Lab-1
No ratings yet
ML Lab-1
32 pages
Da Lab Mannual
No ratings yet
Da Lab Mannual
25 pages
Ds Notes Mca
No ratings yet
Ds Notes Mca
30 pages
Data Analytics
No ratings yet
Data Analytics
10 pages
CR Lab
No ratings yet
CR Lab
5 pages
1
No ratings yet
1
13 pages
ML Algorithms
100% (1)
ML Algorithms
1 page
Big Data Practical
No ratings yet
Big Data Practical
20 pages
AI Assignment-6
No ratings yet
AI Assignment-6
7 pages
Machine Learning Assignment 1
No ratings yet
Machine Learning Assignment 1
4 pages
VND - Openxmlformats Officedocument - Wordprocessingml.document&rendition 1
No ratings yet
VND - Openxmlformats Officedocument - Wordprocessingml.document&rendition 1
24 pages
Task 4
No ratings yet
Task 4
2 pages
ML
No ratings yet
ML
17 pages
How To Create A Python Model
No ratings yet
How To Create A Python Model
29 pages
Linearregression SVM
No ratings yet
Linearregression SVM
3 pages
Report
No ratings yet
Report
14 pages
Python For Data Science IA 1 Programs
No ratings yet
Python For Data Science IA 1 Programs
14 pages
A3 Classification and Feature Engineering
No ratings yet
A3 Classification and Feature Engineering
2 pages
Udacity Machine Learning Analysis Supervised Learning
100% (1)
Udacity Machine Learning Analysis Supervised Learning
504 pages
LAB MANUAL For Machine Learning
No ratings yet
LAB MANUAL For Machine Learning
15 pages
ML Lab
No ratings yet
ML Lab
7 pages
3 Classification
No ratings yet
3 Classification
16 pages
Practicalpgm ML
No ratings yet
Practicalpgm ML
33 pages
Machine Learning Lab Manual
No ratings yet
Machine Learning Lab Manual
22 pages
MlLabManualdocx 2024 09 04 22 02 58
No ratings yet
MlLabManualdocx 2024 09 04 22 02 58
19 pages
Report On Stock Price Prediction
No ratings yet
Report On Stock Price Prediction
14 pages
AI and ML Lab Ex3 To 12
No ratings yet
AI and ML Lab Ex3 To 12
27 pages
Ashwin Report
No ratings yet
Ashwin Report
18 pages
ML Manual With Outputs
No ratings yet
ML Manual With Outputs
30 pages
ML Lab Programs
No ratings yet
ML Lab Programs
9 pages
F 11
No ratings yet
F 11
3 pages
Prathamesh KRAI
No ratings yet
Prathamesh KRAI
38 pages
Random Forest
No ratings yet
Random Forest
11 pages
Python For Data Science IA 1 Programs
No ratings yet
Python For Data Science IA 1 Programs
14 pages
Machine
100% (1)
Machine
45 pages
Scikit Learn What Were Covering
No ratings yet
Scikit Learn What Were Covering
15 pages
PA Lab2
No ratings yet
PA Lab2
11 pages
Data Mining Practicals
No ratings yet
Data Mining Practicals
22 pages
Programs Lab Bca
No ratings yet
Programs Lab Bca
16 pages
MLT 1 - 7 Kanish
No ratings yet
MLT 1 - 7 Kanish
24 pages
Building, Tuning, and Deploying Models
No ratings yet
Building, Tuning, and Deploying Models
11 pages
ML Practical 205160694034
No ratings yet
ML Practical 205160694034
33 pages
ML Experiments TerminalStyle Corrected
No ratings yet
ML Experiments TerminalStyle Corrected
6 pages
Aiml Practical
No ratings yet
Aiml Practical
17 pages
Machine Learning Cheatsheet
No ratings yet
Machine Learning Cheatsheet
5 pages
Sklearn
No ratings yet
Sklearn
141 pages
Case Study - Classifier
No ratings yet
Case Study - Classifier
5 pages
Minor Project
No ratings yet
Minor Project
21 pages
AI Lab M.Tech
No ratings yet
AI Lab M.Tech
29 pages
DATA MINING AND MACHINE LEARNING. PREDICTIVE TECHNIQUES: REGRESSION, GENERALIZED LINEAR MODELS, SUPPORT VECTOR MACHINE AND NEURAL NETWORKS
From Everand
DATA MINING AND MACHINE LEARNING. PREDICTIVE TECHNIQUES: REGRESSION, GENERALIZED LINEAR MODELS, SUPPORT VECTOR MACHINE AND NEURAL NETWORKS
César Pérez López
No ratings yet
Python For Beginners
From Everand
Python For Beginners
Célio Azevedo
No ratings yet
Data Modeling With Graph Databases
100% (2)
Data Modeling With Graph Databases
68 pages
June 2015 QP - Unit 1 WJEC Chemistry A-Level
No ratings yet
June 2015 QP - Unit 1 WJEC Chemistry A-Level
26 pages
Datasheet Item 4 SQ 12403653
No ratings yet
Datasheet Item 4 SQ 12403653
7 pages
My Bank Statement
No ratings yet
My Bank Statement
3 pages
1597 KI Avant Tone Horn S140 HELLA EN
No ratings yet
1597 KI Avant Tone Horn S140 HELLA EN
2 pages
Dell Latitude PDF
No ratings yet
Dell Latitude PDF
8 pages
Android Debug Bridge (Adb)
No ratings yet
Android Debug Bridge (Adb)
24 pages
MagNet - Introduction
No ratings yet
MagNet - Introduction
141 pages
WRE301 Chapter 4
No ratings yet
WRE301 Chapter 4
93 pages
fl23 Algebra1 Ipe 03 07
No ratings yet
fl23 Algebra1 Ipe 03 07
10 pages
VFR Navigation
No ratings yet
VFR Navigation
3 pages
Japanese Cheesecake
No ratings yet
Japanese Cheesecake
1 page
A571a571m 01 (2011)
No ratings yet
A571a571m 01 (2011)
5 pages
Chapter 6 Continuous Probability Distribution
No ratings yet
Chapter 6 Continuous Probability Distribution
47 pages
R.N. Kapoor Memorial Homoeopathic Hospital & Medical College, INDORE
100% (3)
R.N. Kapoor Memorial Homoeopathic Hospital & Medical College, INDORE
13 pages
40XV648U, 46XV648U and 52XV648U: Firmware Installation Notice
No ratings yet
40XV648U, 46XV648U and 52XV648U: Firmware Installation Notice
2 pages
01a IGCSE Maths 4MB1 01 - January 2021 Examination Paper
No ratings yet
01a IGCSE Maths 4MB1 01 - January 2021 Examination Paper
24 pages
Statistics With R Unit 1: Divya Arun Kumar
No ratings yet
Statistics With R Unit 1: Divya Arun Kumar
65 pages
OOPs Lab Manual
0% (1)
OOPs Lab Manual
88 pages
Fiitjee All India Test Series: JEE (Advanced) - 2020
No ratings yet
Fiitjee All India Test Series: JEE (Advanced) - 2020
19 pages
SL2020-692 LDCL Update PDF
No ratings yet
SL2020-692 LDCL Update PDF
7 pages
Slab Punching H11
No ratings yet
Slab Punching H11
10 pages
Manual HC For in Rack Sprinklers Reference NFPA 13 - 2013, Chapter 23 (PLANS AND CALCULATIONS) (Mehboob Shaikh)
100% (1)
Manual HC For in Rack Sprinklers Reference NFPA 13 - 2013, Chapter 23 (PLANS AND CALCULATIONS) (Mehboob Shaikh)
16 pages
4082WWT Grit Removal
No ratings yet
4082WWT Grit Removal
21 pages
Datasheet PSR30 600 70
No ratings yet
Datasheet PSR30 600 70
6 pages
ASTM Seminar - Finnie - ReleaseRate
No ratings yet
ASTM Seminar - Finnie - ReleaseRate
21 pages
Is 13882
No ratings yet
Is 13882
44 pages
U-Bracket Used For Wall Mounting
No ratings yet
U-Bracket Used For Wall Mounting
3 pages
Assignment - I
No ratings yet
Assignment - I
4 pages

Note: This service is not intended for secure transactions such as banking, social media, email, or purchasing. Use at your own risk. We assume no liability whatsoever for broken pages.

Coe Projects

Uploaded by

Coe Projects

Uploaded by

coe-projects

[ ]: # Predictive Analytics for Sales Forecasting

# Split data into train and test sets

# linear regression model

# Training the model

# Use the trained model to make predictions

# Visualizing with matplotlib

from textblob import TextBlob

# Sample social media comments/reviews

# Perform sentiment analysis on each comment

'I love this product! It's amazing!' - Positive

[ ]: # Healthcare analytics: disease prediction

# libraries for modeling & prediction

# relevant features for the model

# Split data into train and test sets

# Random Forest prediction

# data modeling part

# Visualize using seaborn and matplotlib

[ ]: # recommendation system for e-commerce

from surprise import Dataset, Reader, KNNBasic

# Split data into train and test sets

# Evaluate the model

# Make recommendations for a user

[1]: # natural language processing for text classification

# Sample data - replace with your own dataset

# Split data into features and labels

# Split data into training and testing sets

# Feature extraction using TF-IDF vectorization

# Evaluate the model

negative 0.00 0.00 0.00 1.0

accuracy 0.00 1.0

[ ]: # time series analysis for stock price prediction

# Load historical stock price data

# Calculate financial indicators (e.g., moving averages, RSI, MACD, etc.)

# Define features and target variable

# Drop rows with missing values

# Split data into features and target variable

# Split data into training and testing sets

# Train a Random Forest regressor

# Evaluate the model

# Plot actual vs. predicted prices

plt.title('Stock Price Prediction')

You might also like

Pfad - The Proxy pFad of © 2024 Garber Painting. All rights reserved.