Random Forest

RANDOM FOREST ALGORITHM
ALL ALGORITHMS USING BY 21 DATASET (text3)document
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, classification_report
# Random Forest text-classification script: load labelled text from an Excel
# workbook, vectorize it with TF-IDF, train a Random Forest, and report
# accuracy plus a per-class classification report on a held-out test split.

# Read data from Excel file
file_path = '/content/ai.xlsx'  # Replace with your actual file path
df = pd.read_excel(file_path)

# The workbook must provide a 'text' column (documents) and a 'label' column
# (class labels). Text is cast to str so non-string cells do not break the
# vectorizer.
X = df['text'].astype(str)
y = df['label']

# Split the dataset into training and testing sets (80/20, fixed seed so the
# split is reproducible between runs).
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

# Vectorize the text data using TF-IDF. The vectorizer is fitted on the
# training split only and then applied to the test split, so no vocabulary
# or IDF statistics leak from the test data.
vectorizer = TfidfVectorizer(max_features=5000)
X_train_tfidf = vectorizer.fit_transform(X_train)
X_test_tfidf = vectorizer.transform(X_test)

# Train a Random Forest classifier
classifier = RandomForestClassifier(n_estimators=100, random_state=42)
classifier.fit(X_train_tfidf, y_train)

# Make predictions on the test set
y_pred = classifier.predict(X_test_tfidf)

# Evaluate the model. Accuracy is computed here from this run's predictions;
# previously `accuracy` was never assigned in this script, so the print below
# either raised NameError or showed a stale value left over from another
# notebook cell that disagreed with the classification report.
accuracy = accuracy_score(y_test, y_pred)

# Print the results, with accuracy shown to 4 decimal places
print(f'Accuracy: {accuracy:.4f}')
print('\nClassification Report:')
# Both the accuracy and the report are derived from the same y_pred, so the
# two figures are consistent with each other.
print(classification_report(y_test, y_pred))
Accuracy: 0.7500
Classification Report:
precision recall f1-score support
0 1.00 1.00 1.00 2

1 1.00 1.00 1.00 2
accuracy 1.00 4
macro avg 1.00 1.00 1.00 4
weighted avg 1.00 1.00 1.00 4
XGBOOST CLASSIFIER ALGORITHM
import pandas as pd
from xgboost import XGBClassifier

y = df['label']

random_state=42)

# Train an XGBoost classifier

classifier = XGBClassifier()


places
Accuracy: 0.7500
0 0.50 0.50 0.50 2

1 0.50 0.50 0.50 2
accuracy 0.50 4
macro avg 0.50 0.50 0.50 4
weighted avg 0.50 0.50 0.50 4
SVM CLASSIFIER ALGORITHM
import pandas as pd
from sklearn.svm import LinearSVC

y = df['label']

random_state=42)

# Train a linear SVM classifier

classifier = LinearSVC()


places
Accuracy: 0.7500
0 1.00 1.00 1.00 2

1 1.00 1.00 1.00 2
accuracy 1.00 4
macro avg 1.00 1.00 1.00 4
weighted avg 1.00 1.00 1.00 4
NAIVE BAYES ALGORITHM
import pandas as pd
from sklearn.naive_bayes import MultinomialNB

file_path = '/content/text3.csv' # Replace with your actual file path
df = pd.read_csv(file_path)
y = df['label']
random_state=42)

# Train a Multinomial Naive Bayes classifier

classifier = MultinomialNB()

# Evaluate the model

accuracy = accuracy_score(y_test, y_pred)
report = classification_report(y_test, y_pred)
# Print the results

print(f'Accuracy: {accuracy}')
print(report)
Accuracy: 0.75
0 0.67 1.00 0.80 2

1 1.00 0.50 0.67 2
accuracy 0.75 4
macro avg 0.83 0.75 0.73 4
weighted avg 0.83 0.75 0.73 4
RANDOM FOREST CLASSIFIER
import pandas as pd
from sklearn.ensemble import RandomForestClassifier

file_path = '/content/text3.csv' # Replace with your actual file path
df = pd.read_csv(file_path)
y = df['label']

random_state=42)

# Train a Random Forest classifier

classifier = RandomForestClassifier(n_estimators=100, random_state=42)


places
Accuracy: 0.8
0 1.00 1.00 1.00 2

1 1.00 1.00 1.00 2
accuracy 1.00 4
macro avg 1.00 1.00 1.00 4
weighted avg 1.00 1.00 1.00 4

Random Forest

Uploaded by

Copyright:

Available Formats

Random Forest

Uploaded by

Document Information

Original Title

Copyright

Available Formats

Share this document

Share or Embed Document

Sharing Options

Did you find this document useful?

Is this content inappropriate?

Copyright:

Available Formats

Random Forest

Uploaded by

Copyright:

Available Formats

RANDOM FOREST ALGORITHM

ALL ALGORITHMS USING BY 21 DATASET (text3)document

from sklearn.metrics import accuracy_score, classification_report

# Read data from Excel file

# Split the dataset into training and testing sets

# Vectorize the text data using TF-IDF

# Train a Random Forest classifier

# Make predictions on the test set

# Print the results including accuracy value

0 1.00 1.00 1.00 2

XGBOOST CLASSIFIER ALGORITHM

# Read data from Excel file

# Split the dataset into training and testing sets

# Vectorize the text data using TF-IDF

# Train an XGBoost classifier

# Make predictions on the test set

# Print the results including accuracy value

0 0.50 0.50 0.50 2

SVM CLASSIFIER ALGORITHM

# Read data from Excel file

# Split the dataset into training and testing sets

# Vectorize the text data using TF-IDF

# Train a linear SVM classifier

# Make predictions on the test set

# Print the results including accuracy value

0 1.00 1.00 1.00 2

NAIVE BAYES ALGORITHM

# Read data from Excel file

# Vectorize the text data using TF-IDF

# Train a Multinomial Naive Bayes classifier

# Make predictions on the test set

# Evaluate the model

# Print the results

0 0.67 1.00 0.80 2

# Read data from Excel file

# Split the dataset into training and testing sets

# Vectorize the text data using TF-IDF

# Train a Random Forest classifier

# Make predictions on the test set

# Print the results including accuracy value

0 1.00 1.00 1.00 2

You might also like

Pfad - The Proxy pFad of © 2024 Garber Painting. All rights reserved.