0% found this document useful (0 votes)

21 views10 pages

Codingan Materi

Uploaded by

David Baridji

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

21 views10 pages

Codingan Materi

Uploaded by

David Baridji

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 10

4/2/24, 5:39 PM Analisis sentimen Gojek V4.8 | Random Forest - Colaboratory

# IMPORTANT: RUN THIS CELL IN ORDER TO IMPORT YOUR KAGGLE DATA SOURCES
# TO THE CORRECT LOCATION (/kaggle/input) IN YOUR NOTEBOOK,
# THEN FEEL FREE TO DELETE THIS CELL.
# NOTE: THIS NOTEBOOK ENVIRONMENT DIFFERS FROM KAGGLE'S PYTHON
# ENVIRONMENT SO THERE MAY BE MISSING LIBRARIES USED BY YOUR
# NOTEBOOK.

import os
import sys
from tempfile import NamedTemporaryFile
from urllib.request import urlopen
from urllib.parse import unquote, urlparse
from urllib.error import HTTPError
from zipfile import ZipFile
import tarfile
import shutil

CHUNK_SIZE = 40960
DATA_SOURCE_MAPPING = 'gojek-app-reviews-bahasa-indonesia:https%3A%2F%2Ffanyv88.com%3A443%2Fhttps%2Fstorage.googleapis.com%2Fkaggle-data-sets%2F4394044%2F7545387%2Fbundle

KAGGLE_INPUT_PATH='/kaggle/input'
KAGGLE_WORKING_PATH='/kaggle/working'
KAGGLE_SYMLINK='kaggle'

!umount /kaggle/input/ 2> /dev/null

shutil.rmtree('/kaggle/input', ignore_errors=True)
os.makedirs(KAGGLE_INPUT_PATH, 0o777, exist_ok=True)
os.makedirs(KAGGLE_WORKING_PATH, 0o777, exist_ok=True)

# Expose the Kaggle input and working directories as '../input' and
# '../working'. A link that already exists (e.g. from an earlier run of this
# cell) is left in place.
for _link_target, _link_name in (
    (KAGGLE_INPUT_PATH, 'input'),
    (KAGGLE_WORKING_PATH, 'working'),
):
    try:
        os.symlink(_link_target, os.path.join("..", _link_name), target_is_directory=True)
    except FileExistsError:
        pass

# Download every "<directory>:<percent-encoded URL>" entry of
# DATA_SOURCE_MAPPING and unpack the archive into KAGGLE_INPUT_PATH/<directory>.
# A source that cannot be fetched or unpacked is reported and skipped.
for data_source_mapping in DATA_SOURCE_MAPPING.split(','):
    # Split on the first ':' only; everything after it is the encoded URL.
    directory, download_url_encoded = data_source_mapping.split(':', 1)
    download_url = unquote(download_url_encoded)
    filename = urlparse(download_url).path
    destination_path = os.path.join(KAGGLE_INPUT_PATH, directory)
    try:
        with urlopen(download_url) as fileres, NamedTemporaryFile() as tfile:
            total_length = fileres.headers['content-length']
            print(f'Downloading {directory}, {total_length} bytes compressed')
            # The header can be missing; without a total the bar stays empty
            # instead of failing on int(None) or dividing by zero.
            total_bytes = int(total_length) if total_length else 0
            dl = 0
            data = fileres.read(CHUNK_SIZE)
            while len(data) > 0:
                dl += len(data)
                tfile.write(data)
                done = int(50 * dl / total_bytes) if total_bytes else 0
                sys.stdout.write(f"\r[{'=' * done}{' ' * (50-done)}] {dl} bytes downloaded")
                sys.stdout.flush()
                data = fileres.read(CHUNK_SIZE)
            # The tar branch reopens the file by name, so buffered bytes must
            # be on disk before the archive is read.
            tfile.flush()
            if filename.endswith('.zip'):
                with ZipFile(tfile) as zfile:
                    zfile.extractall(destination_path)
            else:
                # Bind to a separate name: reusing 'tarfile' here would
                # replace the module and break the next tar data source.
                with tarfile.open(tfile.name) as tar_archive:
                    tar_archive.extractall(destination_path)
            print(f'\nDownloaded and uncompressed: {directory}')
    except HTTPError:
        print(f'Failed to load (likely expired) {download_url} to path {destination_path}')
    except OSError:
        print(f'Failed to load {download_url} to path {destination_path}')

print('Data source import complete.')

account_circle Downloading gojek-app-reviews-bahasa-indonesia, 8220381 bytes compressed

[==================================================] 8220381 bytes downloaded

# This Python 3 environment comes with many helpful analytics libraries installed
# It is defined by the kaggle/python Docker image: https://github.com/kaggle/docker-python
# For example, here's several helpful packages to load

import numpy as np # linear algebra

import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)

# Input data files are available in the read-only "../input/" directory

# For example, running this (by clicking run or pressing Shift+Enter) will list all files under the input directory

import os
# Print the full path of every file found below /kaggle/input.
for _root, _subdirs, _files in os.walk('/kaggle/input'):
    for _name in _files:
        print(os.path.join(_root, _name))

# You can write up to 20GB to the current directory (/kaggle/working/) that gets preserved as output when you create a version using "Save & Run All"
# You can also write temporary files to /kaggle/temp/, but they won't be saved outside of the current session

/kaggle/input/gojek-app-reviews-bahasa-indonesia/GojekAppReviewV4.0.0-V4.9.3_Cleaned.csv

keyboard_arrow_down Load Data

df = pd.read_csv('/kaggle/input/gojek-app-reviews-bahasa-indonesia/GojekAppReviewV4.0.0-V4.9.3_Cleaned.csv')
df.head()

userName content score at appVersion

2022-01-21
0 Yuga Edit akun gopay saya di blok 1 4.9.3
10:52:12

Lambat sekali sekarang ini 2021-11-30

1 ff burik 3 4.9.3
bosssku apk gojek g... 15:40:38

Anisa Suci Kenapa sih dari kemarin sy 2021-11-29

2 4 4.9.3
Rahmayuliani buka aplikasi gojek... 22:58:12

Baru download gojek dan hape 2022-09-03

3 naoki yakuza 1 493

keyboard_arrow_down EDA & Preprocessing

import seaborn as sns
import matplotlib.pyplot as plt

sum(df['appVersion'].str.startswith("4.8"))

8091

# Keep only the reviews whose app version starts with "4.8" and the columns
# needed downstream. na=False treats a missing appVersion as "no match";
# without it a NaN in the mask makes the boolean indexing raise.
is_v48 = df['appVersion'].str.startswith("4.8", na=False)
df = df.loc[is_v48, ['userName', 'content', 'score']]

df.head()

userName content score

133 Abu karim aljabbar Mkatiksaidi Ramah banget 5

134 Fathan Mubina Setelah update kok nggak bisa dibuka 4

135 Nyauw Jin Fie Good 5

136 Tanaka Kun Good 5

137 Anton S. Sangat membantu 5

Next steps: toggle_off View recommended plots

# hapus duplikasi
df = df.dropna(subset=['content']).drop_duplicates()

# stopwords
stop_words = stopwords.words('indonesian') + stopwords.words('english') + ["yg", "gak", "ngisi", "udah", "d", "sih", "nya", "srg", "utk", "b
df['content'] = df['content'].apply(lambda x: [word.lower() for word in word_tokenize(x) if (word.isalpha() and word.lower() not in stop_wor

# normalisasi teks
df['content'] = df['content'].apply(lambda x: ' '.join(x))

df.head()

[nltk_data] Downloading package stopwords to /root/nltk_data...

[nltk_data] Unzipping corpora/stopwords.zip.
[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data] Unzipping tokenizers/punkt.zip.
userName content score

133 Abu karim aljabbar Mkatiksaidi ramah banget 5

134 Fathan Mubina update nggak dibuka 4

135 Nyauw Jin Fie good 5

136 Tanaka Kun good 5

137 Anton S. membantu 5

Next steps: toggle_off View recommended plots

!pip install Sastrawi

!pip install VaderSentiment

Collecting Sastrawi
Downloading Sastrawi-1.0.1-py2.py3-none-any.whl (209 kB)
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 209.7/209.7 kB 2.0 MB/s eta 0:00:00
Installing collected packages: Sastrawi
Successfully installed Sastrawi-1.0.1
Collecting VaderSentiment
Downloading vaderSentiment-3.3.2-py2.py3-none-any.whl (125 kB)
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 126.0/126.0 kB 1.3 MB/s eta 0:00:00
Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from VaderSentiment) (2.31.0)
Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->VaderSentiment) (3.3.
Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->VaderSentiment) (3.6)
Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->VaderSentiment) (2.0.7)
Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->VaderSentiment) (2024.2.2)
Installing collected packages: VaderSentiment
Successfully installed VaderSentiment-3.3.2

# stemming
from Sastrawi.Stemmer.StemmerFactory import StemmerFactory

stemmer = StemmerFactory().create_stemmer()


def _stem_tokens(text):
    """Stem each whitespace-separated token of *text* and re-join with spaces."""
    return ' '.join(stemmer.stem(token) for token in text.split())


df['content'] = df['content'].apply(_stem_tokens)

df.head(5)

userName content score

133 Abu karim aljabbar Mkatiksaidi ramah banget 5

134 Fathan Mubina update nggak buka 4

135 Nyauw Jin Fie good 5

136 Tanaka Kun good 5

137 Anton S. bantu 5

Next steps: toggle_off View recommended plots

# labelling
from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer

analyzer = SentimentIntensityAnalyzer()

# Hand-assigned valence scores for Indonesian review vocabulary. The mapping
# is merged into the VADER analyzer's lexicon right after this literal, so
# the sign of each value decides which way a word pushes the compound score.
additional_lexicon_id = {
    'kecewa': -0.4,
    'rugi': -1,
    'buruk': -0.6,
    'jelek': -0.6,
    'lelet': -0.7,
    'gagal': -0.5,
    'parah': -0.6,
    'mahal': -0.3,
    'tolong': -0.1,
    'hilang': -0.3,
    'gajelas': -0.3,
    'gj': -0.3,
    'promo': 0.6,
    'kadang': -0.1,
    'maling': -0.5,
    # 'ganggu' (to disturb / annoy) is a complaint word; it was scored +0.3,
    # which pulled reviews containing it towards "Positif".
    'ganggu': -0.3,
    'sedot': -0.5,
    'bagus': 0.5,
    'pulsa': 0,
    'potong': -1,
    'baik': 0.5,
    'kntl': -1,
    'ngelag': -0.8,
    'salah': -0.5,
    'bintang': 0,
    'benerin': -0.4,
    'lambat': -0.8,
    'siput': -0.4,
    'mati': -0.7,
    'minimal': -0.3,
    'susah': -0.6,
    'nagih': -0.6,
    'capek': -0.7,
    'kacau': -0.3,
    'tagih': -0.3,
    'mantap': 1,
    'puas': 0.9,
    'sampah': -0.5,
    'sulit': -0.6,
    'aneh': -0.4,
}

analyzer.lexicon.update(additional_lexicon_id)

df['sentimen'] = df['content'].apply(lambda x: 'Positif' if analyzer.polarity_scores(x)['compound'] > 0 else ('Negatif' if analyzer.polarity

userName content score sentimen

Abu karim aljabbar

133 ramah banget 5 Netral
Mkatiksaidi

134 Fathan Mubina update nggak buka 4 Netral

135 Nyauw Jin Fie good 5 Positif

136 Tanaka Kun good 5 Positif

137 Anton S. bantu 5 Netral

... ... ... ... ...

8219 Malik Azis gopay mantap 5 Positif

buka aplnya hapus download beberpa

8220 Zunus 1 Netral
kali restar...

8221 Mutiara Purnama bye bye gojek alih ijo lah mantapp 1 Netral

8222 Melanie Anggi fitur gomed ya 5 Netral

8223 Ade Nurul Hidayah go food mahal ah 1 Negatif

Next steps: toggle_off View recommended plots

# TF-IDF
from sklearn.feature_extraction.text import TfidfVectorizer

tfidf_vectorizer = TfidfVectorizer()
X_tfidf = tfidf_vectorizer.fit_transform(df['content'])

keyboard_arrow_down Analisis Sentimen

from wordcloud import WordCloud
from plotly import graph_objs as go
import plotly.express as px
import plotly.figure_factory as ff
from collections import Counter

keyboard_arrow_down WordCloud

def _show_wordcloud(cloud, title):
    """Render an already generated word cloud under the given title."""
    plt.imshow(cloud, interpolation="bilinear")
    plt.title(title)
    plt.show()


# Neutral reviews
df_netral = df[df['sentimen'] == 'Netral']
all_words_netral = ' '.join(df_netral['content'])
wordcloud_netral = WordCloud(width=500, height=300, random_state=21, max_font_size=110).generate(all_words_netral)
_show_wordcloud(wordcloud_netral, 'Word Cloud dari Sentimen Netral')

# Positive reviews. This section was missing: wordcloud_positif was plotted
# and df_positif is used by the donut plot further down, but neither was
# ever assigned.
df_positif = df[df['sentimen'] == 'Positif']
all_words_positif = ' '.join(df_positif['content'])
wordcloud_positif = WordCloud(width=500, height=300, random_state=21, max_font_size=110).generate(all_words_positif)
_show_wordcloud(wordcloud_positif, 'Word Cloud dari Sentimen Positif')

# Negative reviews
df_negatif = df[df['sentimen'] == 'Negatif']
all_words_negatif = ' '.join(df_negatif['content'])
wordcloud_negatif = WordCloud(width=500, height=300, random_state=21, max_font_size=110).generate(all_words_negatif)
_show_wordcloud(wordcloud_negatif, 'Word Cloud dari Sentimen Negatif')

keyboard_arrow_down Distribusi Target

# Number of reviews per sentiment label, most frequent label first.
temp = (
    df.groupby('sentimen')['content']
    .count()
    .reset_index()
    .sort_values(by='content', ascending=False)
)
temp.style.background_gradient(cmap='inferno_r')

sentimen content

1 Netral 3987

2 Positif 2541

0 Negatif 1562

plt.figure(figsize=(12,6))
sns.countplot(x='sentimen',data=df)

<Axes: xlabel='sentimen', ylabel='count'>

fig = go.Figure(go.Funnelarea(
text =temp.sentimen,
values = temp.content,
title = {"position": "top center", "text": "Funnel-Chart dari Distribusi target"}
))
fig.show()

Funnel-Chart

!pip install palettable

from palettable.colorbrewer.qualitative import Pastel1_7

Collecting palettable
Downloading palettable-3.3.3-py2.py3-none-any.whl (332 kB)
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 332.3/332.3 kB 2.2 MB/s eta 0:00:00
Installing collected packages: palettable
Successfully installed palettable-3.3.3

https://colab.research.google.com/#fileId=https%3A//storage.googleapis.com/kaggle-colab-exported-notebooks/analisis-sentimen-gojek-v4-8-rando… 7/10
4/2/24, 5:39 PM Analisis sentimen Gojek V4.8 | Random Forest - Colaboratory
# Donut chart of the 12 most frequent words in the neutral reviews.
netral_tokens = df_netral['content'].str.split(expand=True).stack()
unique_netral_words = netral_tokens.value_counts().reset_index()
unique_netral_words.columns = ['words', 'count']
top_20_words = unique_netral_words.head(12)  # holds 12 rows despite the name

plt.figure(figsize=(12, 6))
plt.pie(top_20_words['count'], labels=top_20_words['words'], colors=Pastel1_7.hex_colors)
# A white disc drawn over the centre turns the pie into a donut.
my_circle = plt.Circle((0, 0), 0.7, color='white')
plt.gca().add_artist(my_circle)
plt.title('Donut Plot dari Sentimen Netral')
plt.show()

# Donut chart of the 12 most frequent words in the positive reviews.
positif_tokens = df_positif['content'].str.split(expand=True).stack()
unique_positif_words = positif_tokens.value_counts().reset_index()
unique_positif_words.columns = ['words', 'count']
top_20_words = unique_positif_words.head(12)  # holds 12 rows despite the name

plt.figure(figsize=(12, 6))
plt.pie(top_20_words['count'], labels=top_20_words['words'], colors=Pastel1_7.hex_colors)
# A white disc drawn over the centre turns the pie into a donut.
my_circle = plt.Circle((0, 0), 0.7, color='white')
plt.gca().add_artist(my_circle)
plt.title('Donut Plot dari Sentimen positif')
plt.show()

https://colab.research.google.com/#fileId=https%3A//storage.googleapis.com/kaggle-colab-exported-notebooks/analisis-sentimen-gojek-v4-8-rando… 8/10
4/2/24, 5:39 PM Analisis sentimen Gojek V4.8 | Random Forest - Colaboratory
# Donut chart of the 12 most frequent words in the negative reviews.
negatif_tokens = df_negatif['content'].str.split(expand=True).stack()
unique_negatif_words = negatif_tokens.value_counts().reset_index()
unique_negatif_words.columns = ['words', 'count']
top_20_words = unique_negatif_words.head(12)  # holds 12 rows despite the name

plt.figure(figsize=(12, 6))
plt.pie(top_20_words['count'], labels=top_20_words['words'], colors=Pastel1_7.hex_colors)
# A white disc drawn over the centre turns the pie into a donut.
my_circle = plt.Circle((0, 0), 0.7, color='white')
plt.gca().add_artist(my_circle)
plt.title('Donut Plot dari Sentimen negatif')
plt.show()

keyboard_arrow_down SPLIT

# splitting
from sklearn.model_selection import train_test_split

# Split the raw texts first and fit TF-IDF on the training part only.
# Splitting an X_tfidf that was fitted on the whole corpus lets the test
# reviews shape the vocabulary and IDF weights, which inflates test scores.
text_train, text_test, y_train, y_test = train_test_split(
    df['content'], df['sentimen'], test_size=0.2, random_state=42
)
X_train = tfidf_vectorizer.fit_transform(text_train)
X_test = tfidf_vectorizer.transform(text_test)

X_train.shape, X_test.shape

((6472, 6961), (1618, 6961))

keyboard_arrow_down Resampling target

from imblearn.over_sampling import SMOTE

# Oversample the training split so the sentiment classes are balanced; the
# test split is left untouched.
# NOTE(review): the resampled data is later passed to a cross-validated
# search, so synthetic samples may land in the validation folds; confirm
# whether the CV scores are meant to be trusted.
X_train, y_train = SMOTE(random_state=42).fit_resample(X_train, y_train)

plt.figure(figsize=(12, 6))
balance_ax = sns.countplot(x=y_train)
balance_ax.set_title('Distribusi target untuk modeling')
plt.show()

keyboard_arrow_down Model
from sklearn.ensemble import RandomForestClassifier
from sklearn.model_selection import RandomizedSearchCV

# Candidate hyper-parameter values sampled by the random-forest search.
rf_param_grid = {
    'n_estimators': [50, 100, 200],
    'max_depth': [None, 10, 20, 30],
    'min_samples_split': [2, 5, 10],
    'min_samples_leaf': [1, 2, 4],
}

keyboard_arrow_down Random Forest

# Randomised search over rf_param_grid: 10 sampled settings, 5-fold CV,
# ranked by accuracy.
rf_search_options = dict(n_iter=10, cv=5, scoring='accuracy', random_state=42)
rf_model = RandomizedSearchCV(
    RandomForestClassifier(random_state=42),
    rf_param_grid,
    **rf_search_options,
)
rf_model.fit(X_train, y_train)

▸ RandomizedSearchCV
▸ estimator: RandomForestClassifier

▸ RandomForestClassifier

keyboard_arrow_down Model Eval

# print best param
print("\nBest Parameters for Random Forest:", rf_model.best_params_)

Best Parameters for Random Forest: {'n_estimators': 100, 'min_samples_split': 5, 'min_samples_leaf': 1, 'max_depth': None}

# Evaluate the best estimator found by the search on the held-out test split.
from sklearn.metrics import classification_report

best_rf = rf_model.best_estimator_
y_pred_rf = best_rf.predict(X_test)

print("\n\nClassification Report for Random Forest (Tuned):")
rf_report = classification_report(y_test, y_pred_rf)
print(rf_report)

Classification Report for Random Forest (Tuned):

precision recall f1-score support

Negatif 0.84 0.93 0.88 310

Netral 0.96 0.96 0.96 803
Positif 0.98 0.91 0.94 505

https://colab.research.google.com/#fileId=https%3A//storage.googleapis.com/kaggle-colab-exported-notebooks/analisis-sentimen-gojek-v4-8-rando… 10/10

Apache Nifi Tutorial PDF
100% (1)
Apache Nifi Tutorial PDF
67 pages
Argonaut Install Guide 3
No ratings yet
Argonaut Install Guide 3
15 pages
35 Tricky and Complex Unix Interview Questions and Commands
No ratings yet
35 Tricky and Complex Unix Interview Questions and Commands
8 pages
ISX15 CM2250 ZYDEL v4 ZyNoT (Licensed To Smokn Stacks)
100% (3)
ISX15 CM2250 ZYDEL v4 ZyNoT (Licensed To Smokn Stacks)
14 pages
e2gRuleWriter Decision Table Software - e2gRuleEngine Knowledge Base Generator
No ratings yet
e2gRuleWriter Decision Table Software - e2gRuleEngine Knowledge Base Generator
20 pages
!!read Me Firmware Instructions!!
100% (1)
!!read Me Firmware Instructions!!
4 pages
Cat Vs Dog
No ratings yet
Cat Vs Dog
292 pages
Reversing Apks: Example Lab
No ratings yet
Reversing Apks: Example Lab
10 pages
07 VESDA-E VEU-VEP Firmware Upgrade Tech Tip A4 IE Lores
No ratings yet
07 VESDA-E VEU-VEP Firmware Upgrade Tech Tip A4 IE Lores
11 pages
How To Install Oracle Apex 5.0 With Database 12C
0% (1)
How To Install Oracle Apex 5.0 With Database 12C
41 pages
2025-03-30
No ratings yet
2025-03-30
24 pages
Backup4all 4 Professional User Manual
No ratings yet
Backup4all 4 Professional User Manual
220 pages
DH VTHX421H MultiLang SIP EMEA V4.800.0000000.0.R.241114 Release Notes
No ratings yet
DH VTHX421H MultiLang SIP EMEA V4.800.0000000.0.R.241114 Release Notes
8 pages
Normal Abnormal Ear - Ipynb - Colab
No ratings yet
Normal Abnormal Ear - Ipynb - Colab
10 pages
Applio - Installation
No ratings yet
Applio - Installation
5 pages
Basic Commands For Os
No ratings yet
Basic Commands For Os
12 pages
EMA-204-Technical-Software and System Update Quick Manual (ENG) v1.2 - 1.2.0.7
No ratings yet
EMA-204-Technical-Software and System Update Quick Manual (ENG) v1.2 - 1.2.0.7
7 pages
PRPC Certification Bullet Points
100% (14)
PRPC Certification Bullet Points
61 pages
Upgrade DB 10.2.0.4 12.1.0
No ratings yet
Upgrade DB 10.2.0.4 12.1.0
15 pages
BeyondTrust CA SDM Integration
No ratings yet
BeyondTrust CA SDM Integration
20 pages
2017 Quadfecta Simcenter Hands On Workshop Motion PDF
No ratings yet
2017 Quadfecta Simcenter Hands On Workshop Motion PDF
92 pages
Bartender Commander Examples
No ratings yet
Bartender Commander Examples
19 pages
Changelog
No ratings yet
Changelog
15 pages
How To Burn MP3+G (Karaoke) To Disc
100% (3)
How To Burn MP3+G (Karaoke) To Disc
10 pages
Free Net With Psiphon
No ratings yet
Free Net With Psiphon
5 pages
Mill 2D & Solids: Handbook Volume 1
No ratings yet
Mill 2D & Solids: Handbook Volume 1
51 pages
Description: Tags: CODTechnicalReferencev3
No ratings yet
Description: Tags: CODTechnicalReferencev3
20 pages
Bugreport CLT L29 HUAWEICLT L29 2018 06 11 21 40 23 Dumpstate - Log 9571
No ratings yet
Bugreport CLT L29 HUAWEICLT L29 2018 06 11 21 40 23 Dumpstate - Log 9571
3 pages
Agfa Drystar 5500 Image Printer - Software Upgrade
No ratings yet
Agfa Drystar 5500 Image Printer - Software Upgrade
20 pages
Update RS232 TXNR905 E080313
No ratings yet
Update RS232 TXNR905 E080313
3 pages
MM TAXBRA Migracao Batch
No ratings yet
MM TAXBRA Migracao Batch
3 pages
Python: Learn Python in 24 Hours
From Everand
Python: Learn Python in 24 Hours
Alex Nordeen
4/5 (12)
Master Roblox Studio Advanced Game Development Techniques: Roblox Studio, #3
From Everand
Master Roblox Studio Advanced Game Development Techniques: Roblox Studio, #3
Steven Mcananey
No ratings yet
Create 2D Games in Godot 4.4.1
From Everand
Create 2D Games in Godot 4.4.1
Cool Studios
No ratings yet
Panda3d 1.7 Game Developer's Cookbook
From Everand
Panda3d 1.7 Game Developer's Cookbook
Christoph Lang
No ratings yet
CentOS 6 Linux Server Cookbook
From Everand
CentOS 6 Linux Server Cookbook
Jonathan Hobson
No ratings yet
Infrastructure as Code (IAC) Cookbook
From Everand
Infrastructure as Code (IAC) Cookbook
Stephane Jourdan
No ratings yet
Production Ready OpenStack - Recipes for Successful Environments
From Everand
Production Ready OpenStack - Recipes for Successful Environments
Berezin Arthur
No ratings yet
JAVA 9.0 To 13.0 New Features: Learn, Implement and Migrate to New Version of Java.
From Everand
JAVA 9.0 To 13.0 New Features: Learn, Implement and Migrate to New Version of Java.
Mandar Jog
No ratings yet
Docker Networking Cookbook
From Everand
Docker Networking Cookbook
Jon Langemak
No ratings yet
Oracle Ultimate DBA Interview Questions
From Everand
Oracle Ultimate DBA Interview Questions
equitypress
4.5/5 (3)
iOS and OS X Network Programming Cookbook
From Everand
iOS and OS X Network Programming Cookbook
Jon Hoffman
No ratings yet
Azure For Starters
From Everand
Azure For Starters
Chinmoy Mukherjee
No ratings yet
Java 9 Concurrency Cookbook - Second Edition
From Everand
Java 9 Concurrency Cookbook - Second Edition
Javier Fernández González
No ratings yet
Python and SQLite Development
From Everand
Python and SQLite Development
Agus Kurniawan
No ratings yet
The Little Book of Sitecore® Tips: Volume 3
From Everand
The Little Book of Sitecore® Tips: Volume 3
Neil P Shack
5/5 (1)
Spark: Big Data Cluster Computing in Production
From Everand
Spark: Big Data Cluster Computing in Production
Ilya Ganelin
No ratings yet
Puppet for Containerization
From Everand
Puppet for Containerization
Scott Coulton
No ratings yet
Oracle Data Integrator 11g Cookbook
From Everand
Oracle Data Integrator 11g Cookbook
Christophe Dupupet
No ratings yet
Firebase Storage for Angular: A reliable file upload solution for your applications
From Everand
Firebase Storage for Angular: A reliable file upload solution for your applications
Abdelfattah Ragab
No ratings yet
Phaser.js Game Design Workbook: Game development guide using Phaser JavaScript Game Framework
From Everand
Phaser.js Game Design Workbook: Game development guide using Phaser JavaScript Game Framework
Stephen Gose
No ratings yet
eZ Publish 4: Enterprise Web Sites Step-by-Step
From Everand
eZ Publish 4: Enterprise Web Sites Step-by-Step
Francesco Trucchia
No ratings yet
Kali Linux Penetration Testing Bible
From Everand
Kali Linux Penetration Testing Bible
Gus Khawaja
No ratings yet
Godot from Zero to Proficiency (Advanced): Godot from Zero to Proficiency, #1
From Everand
Godot from Zero to Proficiency (Advanced): Godot from Zero to Proficiency, #1
Patrick Felicia
5/5 (1)
The Little Book of Sitecore® Tips: Volume 2
From Everand
The Little Book of Sitecore® Tips: Volume 2
Neil P Shack
No ratings yet
Troubleshooting Ubuntu Server
From Everand
Troubleshooting Ubuntu Server
Bhargav Skanda
No ratings yet
Kubernetes: Build and Deploy Modern Applications in a Scalable Infrastructure. The Complete Guide to the Most Modern Scalable Software Infrastructure.: Docker & Kubernetes, #2
From Everand
Kubernetes: Build and Deploy Modern Applications in a Scalable Infrastructure. The Complete Guide to the Most Modern Scalable Software Infrastructure.: Docker & Kubernetes, #2
Jordan Lioy
No ratings yet
XProc 3.0 Programmer Reference
From Everand
XProc 3.0 Programmer Reference
Erik Siegel
No ratings yet
Docker Tutorial for Beginners: Learn Programming, Containers, Data Structures, Software Engineering, and Coding
From Everand
Docker Tutorial for Beginners: Learn Programming, Containers, Data Structures, Software Engineering, and Coding
Andrew Lee
3/5 (2)
Kubernetes Made Easy
From Everand
Kubernetes Made Easy
Pankaj Joshi
No ratings yet
PostgreSQL 9 Administration Cookbook LITE: Configuration, Monitoring and Maintenance
From Everand
PostgreSQL 9 Administration Cookbook LITE: Configuration, Monitoring and Maintenance
Simon Riggs
3/5 (1)
Learning Powershell DSC: Get started with the fundamentals of PowerShell DSC and utilize its power to automate deployment and configuration of your servers
From Everand
Learning Powershell DSC: Get started with the fundamentals of PowerShell DSC and utilize its power to automate deployment and configuration of your servers
James Pogran
No ratings yet
Oracle: Protect Your Data
From Everand
Oracle: Protect Your Data
Floribert TCHOKO
No ratings yet
Learning Informatica PowerCenter 9.x
From Everand
Learning Informatica PowerCenter 9.x
Rahul Malewar
3/5 (4)
Instant PostgreSQL Backup and Restore How-to
From Everand
Instant PostgreSQL Backup and Restore How-to
Shaun Thomas
No ratings yet
PostgreSQL 9 Administration Cookbook: LITE Edition
From Everand
PostgreSQL 9 Administration Cookbook: LITE Edition
Simon Riggs
3/5 (1)
Performance Project
From Everand
Performance Project
Bruno Skvorc
No ratings yet
Plone 3.3 Site Administration
From Everand
Plone 3.3 Site Administration
Alex Clark
No ratings yet
Action Recognition: Step-by-step Recognizing Actions with Python and Recurrent Neural Network
From Everand
Action Recognition: Step-by-step Recognizing Actions with Python and Recurrent Neural Network
Mark Magic
No ratings yet
Practical Play Framework: Focus on what is really important
From Everand
Practical Play Framework: Focus on what is really important
Alberto Souza
No ratings yet
Using Yocto Project with BeagleBone Black
From Everand
Using Yocto Project with BeagleBone Black
H M Irfan Sadiq
No ratings yet
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
From Everand
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
Manish Soni
No ratings yet
RSGallery Plugin 2.1 for Joomla 1.5 Fixes and Installation Guide with Images
From Everand
RSGallery Plugin 2.1 for Joomla 1.5 Fixes and Installation Guide with Images
Daniel Chay
No ratings yet
TensorFlow Developer Certificate Exam Practice Tests 2024 Made Easy
From Everand
TensorFlow Developer Certificate Exam Practice Tests 2024 Made Easy
Mr Troy
No ratings yet
Blood PitTM In-Game Module
From Everand
Blood PitTM In-Game Module
Stephen Gose
No ratings yet
Visual SourceSafe 2005 Software Configuration Management in Practice
From Everand
Visual SourceSafe 2005 Software Configuration Management in Practice
Aleksandar Seovic
No ratings yet
The Mac Terminal Reference and Scripting Primer
From Everand
The Mac Terminal Reference and Scripting Primer
Jay Docherty
4.5/5 (3)
Configuration of a Simple Samba File Server, Quota and Schedule Backup
From Everand
Configuration of a Simple Samba File Server, Quota and Schedule Backup
Dr. Hedaya Alasooly
No ratings yet
50 Recipes for Programming Node.js
From Everand
50 Recipes for Programming Node.js
Jamie Munro
3/5 (4)
Web Scraping for SEO with Python
From Everand
Web Scraping for SEO with Python
Enrique Vicente
No ratings yet
How to a Developers Guide to 4k: Developer edition, #3
From Everand
How to a Developers Guide to 4k: Developer edition, #3
Xinc Cyberwizard
No ratings yet
The Definitive Guide to Getting Started with OpenCart 2.x
From Everand
The Definitive Guide to Getting Started with OpenCart 2.x
iSenseLabs
No ratings yet
DevOps. How to build pipelines with Jenkins, Docker container, AWS ECS, JDK 11, git and maven 3?
From Everand
DevOps. How to build pipelines with Jenkins, Docker container, AWS ECS, JDK 11, git and maven 3?
John Edward Cooper Berg
No ratings yet
DevOps. How To Build Pipelines With Bitbucket Pipelines + Docker Container + AWS ECS + JDK 11 + Maven 3?
From Everand
DevOps. How To Build Pipelines With Bitbucket Pipelines + Docker Container + AWS ECS + JDK 11 + Maven 3?
John Edward Cooper Berg
No ratings yet
The Little Book of Sitecore® Tips: Volume 1
From Everand
The Little Book of Sitecore® Tips: Volume 1
Neil P Shack
No ratings yet
Cisco Packet Tracer for Beginners
From Everand
Cisco Packet Tracer for Beginners
kalyan chinta
5/5 (3)
Make Backup Copies of Video Games, Movies, CD's, & DVD's
From Everand
Make Backup Copies of Video Games, Movies, CD's, & DVD's
Josh Abbott
1/5 (2)
Evaluation of Some Android Emulators and Installation of Android OS on Virtualbox and VMware
From Everand
Evaluation of Some Android Emulators and Installation of Android OS on Virtualbox and VMware
Dr. Hidaia Mahmood Alassouli
No ratings yet
SAS Programming Guidelines Interview Questions You'll Most Likely Be Asked
From Everand
SAS Programming Guidelines Interview Questions You'll Most Likely Be Asked
Vibrant Publishers
No ratings yet
Configuration of a Simple Samba File Server, Quota and Schedule Backup
From Everand
Configuration of a Simple Samba File Server, Quota and Schedule Backup
Dr. Hidaia Mahmood Alassouli
No ratings yet

Codingan Materi

Uploaded by

Codingan Materi

Uploaded by

4/2/24, 5:39 PM Analisis sentimen Gojek V4.8 | Random Forest - Colaboratory

!umount /kaggle/input/ 2> /dev/null

for data_source_mapping in DATA_SOURCE_MAPPING.split(','):

print('Data source import complete.')

account_circle Downloading gojek-app-reviews-bahasa-indonesia, 8220381 bytes compressed

import numpy as np # linear algebra

# Input data files are available in the read-only "../input/" directory

keyboard_arrow_down Load Data

userName content score at appVersion

Lambat sekali sekarang ini 2021-11-30

Anisa Suci Kenapa sih dari kemarin sy 2021-11-29

Baru download gojek dan hape 2022-09-03

keyboard_arrow_down EDA & Preprocessing

# ambil kolom yg dibutuhkan

userName content score

133 Abu karim aljabbar Mkatiksaidi Ramah banget 5

134 Fathan Mubina Setelah update kok nggak bisa dibuka 4

135 Nyauw Jin Fie Good 5

136 Tanaka Kun Good 5

137 Anton S. Sangat membantu 5

Next steps: toggle_off View recommended plots

[nltk_data] Downloading package stopwords to /root/nltk_data...

133 Abu karim aljabbar Mkatiksaidi ramah banget 5

134 Fathan Mubina update nggak dibuka 4

135 Nyauw Jin Fie good 5

136 Tanaka Kun good 5

137 Anton S. membantu 5

Next steps: toggle_off View recommended plots

!pip install Sastrawi

userName content score

133 Abu karim aljabbar Mkatiksaidi ramah banget 5

134 Fathan Mubina update nggak buka 4

135 Nyauw Jin Fie good 5

136 Tanaka Kun good 5

137 Anton S. bantu 5

Next steps: toggle_off View recommended plots

df['sentimen'] = df['content'].apply(lambda x: 'Positif' if analyzer.polarity_scores(x)['compound'] > 0 else ('Negatif' if analyzer.polarity

userName content score sentimen

Abu karim aljabbar

134 Fathan Mubina update nggak buka 4 Netral

135 Nyauw Jin Fie good 5 Positif

136 Tanaka Kun good 5 Positif

137 Anton S. bantu 5 Netral

... ... ... ... ...

8219 Malik Azis gopay mantap 5 Positif

buka aplnya hapus download beberpa

8222 Melanie Anggi fitur gomed ya 5 Netral

8223 Ade Nurul Hidayah go food mahal ah 1 Negatif

Next steps: toggle_off View recommended plots

keyboard_arrow_down Analisis Sentimen

df_netral = df[df['sentimen'] == 'Netral']

df_negatif = df[df['sentimen'] == 'Negatif']

keyboard_arrow_down Distribusi Target

<Axes: xlabel='sentimen', ylabel='count'>

!pip install palettable

X_train, X_test, y_train, y_test = train_test_split(X_tfidf, df['sentimen'], test_size=0.2, random_state=42)

((6472, 6961), (1618, 6961))

keyboard_arrow_down Resampling target

from imblearn.over_sampling import SMOTE

keyboard_arrow_down Random Forest

keyboard_arrow_down Model Eval

print("\n\nClassification Report for Random Forest (Tuned):")

Classification Report for Random Forest (Tuned):

Negatif 0.84 0.93 0.88 310

You might also like