0% found this document useful (0 votes)

60 views12 pages

Lampiran 1 Pseudocode COATES Algorithm Dengan Menggunakan Software Python

This Python code implements the COATES document clustering algorithm in three steps: 1. It preprocesses documents, calculates TF-IDF weights, and initializes K-means clustering. 2. It performs the first minor iteration using cosine similarity to assign documents to clusters and update cluster centroids. 3. It performs the second minor iteration by calculating a Gini index to identify discriminative attributes, assigning them to clusters based on probability, and updating cluster centroids again. The code provides outputs at each step and prints the final cluster assignments.

Uploaded by

sofyan

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

60 views12 pages

Lampiran 1 Pseudocode COATES Algorithm Dengan Menggunakan Software Python

Uploaded by

sofyan

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 12

Lampiran 1

Pseudocode COATES Algorithm dengan menggunakan Software Python

from nltk.tokenize import word_tokenize

from nltk.corpus import stopwords
from nltk.stem import PorterStemmer
import string
import math

def EuclidianDistance(centroid, TFIDF):
    """Return the Euclidean distance from every document to every centroid.

    Args:
        centroid: Sequence of centroid vectors.
        TFIDF: Sequence of document vectors (same length as the centroids).

    Returns:
        A list with one row per document; row ``d`` holds the distance from
        document ``d`` to each centroid, in centroid order. An empty
        ``centroid`` yields one empty row per document.
    """
    return [
        [
            math.sqrt(sum((c - w) ** 2 for c, w in zip(center, weights)))
            for center in centroid
        ]
        for weights in TFIDF
    ]

def CosineSimilarity(centroid, TFIDF):
    """Return the cosine similarity between every document and every centroid.

    Args:
        centroid: Sequence of centroid vectors.
        TFIDF: Sequence of document vectors (same length as the centroids).

    Returns:
        A list with one row per document; row ``d`` holds the similarity of
        document ``d`` to each centroid, in centroid order. A pair in which
        either vector has zero length scores ``0.0`` instead of raising
        ``ZeroDivisionError``.
    """
    def norm(vector):
        return math.sqrt(sum(value * value for value in vector))

    # Centroid norms do not depend on the document, so compute them once.
    centroidNorms = [norm(center) for center in centroid]

    Cosine = []
    for weights in TFIDF:
        docNorm = norm(weights)
        row = []
        for center, centerNorm in zip(centroid, centroidNorms):
            denominator = docNorm * centerNorm
            if denominator == 0:
                # An all-zero vector has no direction; treat it as dissimilar.
                row.append(0.0)
            else:
                dot = sum(w * c for w, c in zip(weights, center))
                row.append(dot / denominator)
        Cosine.append(row)
    return Cosine

30
def getIndeks(X, Similar, TFIDF):
    """Pick, for each document, the column index of the best score.

    Args:
        X: ``0`` selects the smallest value in each row (distance);
            any other value selects the largest (similarity).
        Similar: One row of scores per document.
        TFIDF: Document matrix; only its length is used, to decide how many
            rows of ``Similar`` are read.

    Returns:
        A list with one column index per document. Ties resolve to the
        first occurrence.
    """
    choose = min if X == 0 else max
    indeks = []
    for position in range(len(TFIDF)):
        row = Similar[position]
        indeks.append(row.index(choose(row)))
    return indeks

def readDocument(a, b):
    """Read the text files ``<a+1>.txt`` .. ``<b>.txt`` from the working directory.

    Args:
        a: Zero-based index of the first document (file ``a + 1``).
        b: Zero-based end index, exclusive (last file read is ``b``).

    Returns:
        A list with the full text of each file, in numeric order.
    """
    doc = []
    for number in range(a + 1, b + 1):
        # The context manager closes each handle; the platform default
        # encoding is kept, matching the plain open(name, "r") call.
        with open(str(number) + ".txt", "r") as handle:
            doc.append(handle.read())
    return doc

def PreProcessing(corpus):
    """Tokenize, filter and stem every text in ``corpus``.

    Args:
        corpus: Iterable of raw document strings.

    Returns:
        A list with one token list per document. Tokens that are English
        stop words or single punctuation characters are dropped; the rest
        are passed through the Porter stemmer.
    """
    stemmer = PorterStemmer()
    # A set makes the per-token membership test O(1).
    stop_words = set(stopwords.words('english')) | set(string.punctuation)

    doc = []
    for text in corpus:
        doc.append([
            stemmer.stem(word)  # stemming (NLTK's stem() also lower-cases by default)
            for word in word_tokenize(text)  # tokenizing
            # Compare case-insensitively: the stop-word list is lower-case,
            # so "The" would otherwise slip through and be stemmed to "the".
            if word.lower() not in stop_words
        ])
    return doc

def getDictionary(doc):
    """Return the distinct tokens of ``doc`` in first-seen order.

    Args:
        doc: Iterable of token lists (one per document).

    Returns:
        A list of unique tokens, ordered by first appearance.
    """
    dictionary = []
    seen = set()  # O(1) duplicate check; the list keeps the order
    for tokens in doc:
        for token in tokens:
            if token not in seen:  # drop duplicates
                seen.add(token)
                dictionary.append(token)
    return dictionary

def getNewCentroid(indeks, TFIDF, K):
    """Compute the mean TF-IDF vector of every cluster.

    Args:
        indeks: Cluster label (``0 .. K-1``) of each document, aligned with
            the rows of ``TFIDF``. Labels outside that range are ignored.
        TFIDF: Document matrix, one weight vector per document.
        K: Number of clusters.

    Returns:
        A list of exactly ``K`` centroid vectors. A cluster without members
        gets an all-zero vector so that centroid positions always line up
        with cluster labels.
    """
    width = len(TFIDF[0]) if TFIDF else 0
    totals = [[0] * width for _ in range(K)]
    members = [0] * K

    # Single pass over the documents instead of repeated list.index() scans.
    for label, row in zip(indeks, TFIDF):
        if 0 <= label < K:
            members[label] += 1
            totals[label] = [acc + value for acc, value in zip(totals[label], row)]

    centroid = []
    for cluster in range(K):
        print(' Finding Centroid', cluster + 1, end='')
        if members[cluster] != 0:
            centroid.append([acc / members[cluster] for acc in totals[cluster]])
        else:
            centroid.append([0.0] * width)
        print('...Done!')
    return centroid

def printCluster(indeks, K):
    """Print the members of each cluster, one cluster per line.

    Args:
        indeks: Cluster label of each document (document numbers are
            printed one-based).
        K: Number of clusters; labels ``0 .. K-1`` are listed.
    """
    print('')
    for cluster in range(K):
        print('CLUSTER', cluster + 1, ':', end='')
        for position, label in enumerate(indeks):
            if label == cluster:
                print(' Doc', position + 1, end='')
        print('')  # end the current cluster line
    print('')

def printme(A, B):
    """Print an abbreviated preview of a vector or a matrix.

    Args:
        A: A flat sequence when ``B == 1``, otherwise a sequence of rows.
        B: ``1`` to preview ``A`` as a vector; otherwise the number of rows,
            in which case the first row and row ``B - 1`` are previewed.

    Each preview shows the first three values, an ellipsis and the last
    value of the sequence.
    """
    if B == 1:
        print(' [', *A[:3], '...', A[-1], ']')
        print('')
    else:
        first = A[0]
        last = A[B - 1]
        print(' [', *first[:3], '...', first[-1], ']')
        for _ in range(3):
            print(' .')
        # Preview the last row itself; indexing A[0][B-1], A[1][B-1], ...
        # would read column B-1 of the first three rows instead.
        print(' [', *last[:3], '...', last[-1], ']\n')

# --- Term weighting: load the corpus and build the TF-IDF matrix -----------
# Files 1.txt-50.txt are read as content, 51.txt-100.txt as auxiliary text.
rawcont = readDocument(0, 50)
rawmeta = readDocument(50, 100)

print('==============')
print('Term Weightned')
print('==============')

print('1.Pre-Processing', end='')
content = PreProcessing(rawcont)
auxiliary = PreProcessing(rawmeta)
print('...Done')

print('2.Finding Dictionary')
dictcont = getDictionary(content)
print(' Content Dictionary = Vector 1 x', len(dictcont))
printme(A=dictcont, B=1)

dictaux = getDictionary(auxiliary)
print(' Auxiliary Dictionary = Vector 1 x', len(dictaux))
printme(A=dictaux, B=1)

print('3.Finding Term Frequency (TF)', end='')
# TF[d][t] = occurrences of dictionary term t in content document d.
TF = [[tokens.count(term) for term in dictcont] for tokens in content]
print('...Done')
print(' TF = Matrix', len(TF), 'x', len(TF[0]))
printme(A=TF, B=len(TF))

print('4.Finding Document Fequency(DF)', end='')
# Freq[t] = number of documents in which term t occurs at least once.
Freq = [
    sum(1 for row in TF if row[column] > 0)
    for column in range(len(TF[0]))
]
print('...Done')
print(' DF = Vector 1 x', len(Freq))
printme(A=Freq, B=1)

print('5.Finding Inverse Document Frequency (IDF)', end='')
# Every dictionary term comes from at least one content document, so the
# document frequency is never zero here.
IDF = [math.log10(len(content) / frequency) for frequency in Freq]
print('...Done')
print(' IDF = Vector 1 x', len(IDF))
printme(A=IDF, B=1)

print('6.Finding Weight(TF*IDF)', end='')
TFIDF = [[tf * idf for tf, idf in zip(row, IDF)] for row in TF]
print('...Done')
print(' TFIDF = Matrix', len(TFIDF), 'x', len(TFIDF[0]))
printme(A=TFIDF, B=len(TFIDF))

hold = input('Input any value to continue...')

# --- Content-based clustering with K-means ---------------------------------
print('\n=====================================')
print('Content Based Algorithm Using K-Means')
print('=====================================')
Iterasi = 1
print('ITERATION ', Iterasi)

K = 4
print('K =', K)

print('1.Initialize Random Centroid', end='')

# Seed documents are given as one-based document numbers.
# NOTE(review): the first seed is 0, so 0 - 1 = -1 selects TFIDF[-1] (the
# last document) - confirm whether document 1 was intended.
temp = [0, 15, 26, 45]
centroid = [TFIDF[temp[i] - 1] for i in range(K)]
print('...Done')

print('2.Compute Euclidian Distance', end='')
Euclid = EuclidianDistance(centroid, TFIDF)
print('...Done')

print('3.Assigned Document to Closest Centroid', end='')
indeksKmeans1 = getIndeks(0, Euclid, TFIDF)
print('...Done')

ulang = True
Iterasi = Iterasi + 1
while ulang:
    print('\nITERATION ', Iterasi)

    print('1.Finding New Centroid')
    centroid1 = getNewCentroid(indeksKmeans1, TFIDF, K)

    print('2.Compute Euclidian Distance Document to New Centroid', end='')
    Euclid = EuclidianDistance(centroid1, TFIDF)
    print('...Done')

    print('3.Assigned Document to New Closest Centroid', end='')
    indeksKmeans2 = getIndeks(0, Euclid, TFIDF)
    print(' Done!')

    if indeksKmeans1 == indeksKmeans2:
        # "Cluster membership unchanged" / "Process stops"
        print('\nAnggota Cluster Tidak Berubah')
        print('Proses Berhenti')
        printCluster(indeksKmeans2, K)
        ulang = False
    else:
        # "Cluster membership changed"
        print('Anggota Cluster Berubah')
        print('Repeat the Process from Step 2')
        print('Centroid = New Centroid')
        print('')
        centroid = centroid1
        # Carry the new assignment forward; without this the next pass
        # recomputes the same centroids and the loop never terminates.
        indeksKmeans1 = indeksKmeans2
        Iterasi = Iterasi + 1

# --- Per-cluster vocabularies and first minor iteration --------------------
# dictclust[c] = distinct content tokens of the documents that K-means put
# in cluster c, in first-seen order.
dictclust = []
for i in range(K):
    temp = []
    seen = set()  # O(1) duplicate check; temp keeps the order
    for j, label in enumerate(indeksKmeans2):
        if label == i:
            for k in content[j]:
                if k not in seen:
                    seen.add(k)
                    temp.append(k)
    dictclust.append(temp)

print('=====================')
print('First Minor Iteration')
print('=====================')
print('1.Finding Cosine Similarity', end='')
Cosine = CosineSimilarity(centroid1, TFIDF)
print('...Done!')

print('2.Assign Document to Closest Cluster', end='')
# Non-zero first argument: pick the highest similarity per document.
indeksFirstIteration = getIndeks(1, Cosine, TFIDF)
print('...Done!')

print('3.Update Cluster Centroid Fisrt Minor Iteration')
centroidFirstIteration = getNewCentroid(indeksFirstIteration, TFIDF, K)
printCluster(indeksFirstIteration, K)

hold = input('Input any value to continue...')

# --- Second minor iteration: auxiliary attributes --------------------------
print('======================')
print('Second Minor Iteration')
print('======================')

print('1.Compute Giny Index', end='')

# Sets give O(1) membership tests; contents are the same as dictclust.
clusterVocab = [set(words) for words in dictclust]

# Frj[i][j] = number of tokens of auxiliary document i that are absent from
# the vocabulary of cluster j; Frm[i] = row total.
# NOTE(review): this counts tokens NOT in the cluster vocabulary, whereas
# step 4 below counts tokens that ARE in it - confirm which is intended.
Frj = []
Frm = []
for i in range(len(auxiliary)):
    temp = []
    for j in range(K):
        count = 0
        for k in auxiliary[i]:
            if k not in clusterVocab[j]:
                count = count + 1
        temp.append(count)
    Frj.append(temp)
    Frm.append(sum(temp))

# Prj[i][j] = Frj[i][j] / Frm[i]; a zero row total yields zeros instead of
# raising ZeroDivisionError.
Prj = []
for i in range(len(Frj)):
    if Frm[i] == 0:
        Prj.append([0.0] * len(Frj[i]))
    else:
        Prj.append([value / Frm[i] for value in Frj[i]])

# Giny[i] = sum over clusters of Prj[i][j] squared.
Giny = []
for i in range(len(Prj)):
    Giny.append(sum(math.pow(Prj[i][j], 2) for j in range(K)))
print('...Done!')

print('2.Compute Average of Giny Index', end='')
Avg = sum(Giny) / len(Giny) if Giny else 0
print('...Done!')

print('3.Mark Attribute as Discrimanatory', end='')

# Ri collects the indices whose index value does not exceed the average.
# NOTE(review): confirm that "<= average" (rather than ">=") is the intended
# threshold direction.
Disc = []
idxdisc = []
Ri = []
for i in range(len(Giny)):
    if Giny[i] <= Avg:
        Disc.append(content[i])
        Ri.append(i)
print('...Done!')

print('4.Compute Probability of Discriminatory Attribute', end='')

# temp2[n][j] = number of tokens of auxiliary document Ri[n] that appear in
# the vocabulary of cluster j.
temp2 = []
for i in range(len(Ri)):
    temp = []
    for j in range(K):
        count = 0
        for k in auxiliary[Ri[i]]:
            if k in clusterVocab[j]:
                count = count + 1
        temp.append(count)
    temp2.append(temp)
print('...Done!')

print('5.Assigned Discriminatory Attribute to Cluster', end='')

# Work on a copy so the first-iteration labels stay available for the
# comparison at the end.
idx = list(indeksFirstIteration)
indeksSecondIteration = idx
for j in range(len(temp2)):
    # Identify whether the discriminatory attribute is assigned to another
    # cluster: take the cluster with the highest count (first one on ties).
    x = max(temp2[j])
    idxx = temp2[j].index(x)
    indeksSecondIteration[Ri[j]] = idxx
print('...Done!')

print('6.Update Cluster Centroid')
centroidSecondIteration = getNewCentroid(indeksSecondIteration, TFIDF, K)
printCluster(indeksSecondIteration, K)

for i in range(len(content)):
    if indeksFirstIteration[i] != indeksSecondIteration[i]:
        print('Doc', i + 1, 'Move from Cluster', indeksFirstIteration[i] + 1,
              'to Cluster', indeksSecondIteration[i] + 1)

38
Lampiran 2
Hasil Pemrograman :

Python 3.6.0 (v3.6.0:41df79263a11, Dec 23 2016, 07:18:10) [MSC v.1900 32 bit (Intel)] on win32
Type "copyright", "credits" or "license()" for more information.
>>>
================= RESTART: F:\Fix\ujicobapython3.py ===========
Term Weightned
==============
1.Pre-Processing...Done
2.Finding Dictionary
Content Dictionary = Vector 1 x 14161
[ 1 introduct the ... pilani ]

Auxiliary Dictionary = Vector 1 x 2640

[ review articl monitor ... gist ]

3.Finding Term Frequency (TF)...Done

TF = Matrix 50 x 14161
[ 14 2 36 ... 0 ]
.
.
.
[ 1 0 0 ... 1 ]

4.Finding Document Fequency(DF)...Done

DF = Vector 1 x 14161
[ 50 50 50 ... 1 ]

5.Finding Inverse Document Frequency (IDF)...Done

IDF = Vector 1 x 14161
[ 0.0 0.0 0.0 ... 1.6989700043360187 ]

6.Finding Weight(TF*IDF)...Done
TFIDF = Matrix 50 x 14161
[ 0.0 0.0 0.0 ... 0.0 ]
.
.
.
[ 1.6989700043360187 0.0 0.0 ... 1.6989700043360187 ]
Input any value to continue...

39
=====================================
Content Based Algorithm Using K-Means
=====================================
ITERATION 1
K=4
1.Initialize Random Centroid...Done
2.Compute Euclidian Distance...Done
3.Assigned Document to Closest Centroid...Done

ITERATION 2
1.Finding New Centroid
Finding Centroid 1...Done!
Finding Centroid 2...Done!
Finding Centroid 3...Done!
Finding Centroid 4...Done!
2.Compute Euclidian Distance Document to New Centroid...Done
3.Assigned Document to New Closest Centroid Done!

Anggota Cluster Tidak Berubah

Proses Berhenti

CLUSTER 1 : Doc 32 Doc 50

CLUSTER 2 : Doc 15
CLUSTER 3 : Doc 26
CLUSTER 4 : Doc 1 Doc 2 Doc 3 Doc 4 Doc 5 Doc 6 Doc 7 Doc 8 Doc 9 Doc
10 Doc 11 Doc 12 Doc 13 Doc 14 Doc 16 Doc 17 Doc 18 Doc 19 Doc 20 Doc
21 Doc 22 Doc 23 Doc 24 Doc 25 Doc 27 Doc 28 Doc 29 Doc 30 Doc 31 Doc
33 Doc 34 Doc 35 Doc 36 Doc 37 Doc 38 Doc 39 Doc 40 Doc 41 Doc 42 Doc
43 Doc 44 Doc 45 Doc 46 Doc 47 Doc 48 Doc 49

=====================
First Minor Iteration
=====================
1.Finding Cosine Similarity...Done!
2.Assign Document to Closest Cluster...Done!
3.Update Cluster Centroid Fisrt Minor Iteration
Finding Centroid 1...Done!
Finding Centroid 2...Done!
Finding Centroid 3...Done!
Finding Centroid 4...Done!

40
CLUSTER 1 : Doc 23 Doc 32 Doc 50
CLUSTER 2 : Doc 15
CLUSTER 3 : Doc 26 Doc 33
CLUSTER 4 : Doc 1 Doc 2 Doc 3 Doc 4 Doc 5 Doc 6 Doc 7 Doc 8 Doc 9 Doc
10 Doc 11 Doc 12 Doc 13 Doc 14 Doc 16 Doc 17 Doc 18 Doc 19 Doc 20 Doc
21 Doc 22 Doc 24 Doc 25 Doc 27 Doc 28 Doc 29 Doc 30 Doc 31 Doc 34 Doc
35 Doc 36 Doc 37 Doc 38 Doc 39 Doc 40 Doc 41 Doc 42 Doc 43 Doc 44 Doc
45 Doc 46 Doc 47 Doc 48 Doc 49

Input any value to continue...

======================
Second Minor Iteration
======================
1.Compute Giny Index...Done!
2.Compute Average of Giny Index...Done!
3.Mark Attribute as Discrimanatory...Done!
4.Compute Probability of Discriminatory Attribute...Done!
5.Assigned Discriminatory Attribute to Cluster...Done!
6.Update Cluster Centroid
Finding Centroid 1...Done!
Finding Centroid 2...Done!
Finding Centroid 3...Done!
Finding Centroid 4...Done!
CLUSTER 1 : Doc 32 Doc 50
CLUSTER 2 :
CLUSTER 3 : Doc 33
CLUSTER 4 : Doc 1 Doc 2 Doc 3 Doc 4 Doc 5 Doc 6 Doc 7 Doc 8 Doc 9 Doc
10 Doc 11 Doc 12 Doc 13 Doc 14 Doc 15 Doc 16 Doc 17 Doc 18 Doc 19 Doc
20 Doc 21 Doc 22 Doc 23 Doc 24 Doc 25 Doc 26 Doc 27 Doc 28 Doc 29 Doc
30 Doc 31 Doc 34 Doc 35 Doc 36 Doc 37 Doc 38 Doc 39 Doc 40 Doc 41 Doc
42 Doc 43 Doc 44 Doc 45 Doc 46 Doc 47 Doc 48 Doc 49

Doc 15 Move from Cluster 2 to Cluster 4

Doc 23 Move from Cluster 1 to Cluster 4
Doc 26 Move from Cluster 3 to Cluster 4

Uol Algorithms
No ratings yet
Uol Algorithms
215 pages
Quantitative Analyst
0% (1)
Quantitative Analyst
12 pages
Big O Notation
100% (1)
Big O Notation
19 pages
Intelligent Maze Solving Robot Based On Image Processing and Graph Theory Algorithms
No ratings yet
Intelligent Maze Solving Robot Based On Image Processing and Graph Theory Algorithms
7 pages
Spelling Correction: Edit Distance: Pawan Goyal
No ratings yet
Spelling Correction: Edit Distance: Pawan Goyal
67 pages
Mid Point Line Drawing Algorithm
100% (3)
Mid Point Line Drawing Algorithm
8 pages
07 Network Flow I
No ratings yet
07 Network Flow I
96 pages
T 5 Open Methods
No ratings yet
T 5 Open Methods
58 pages
Personal Financial Report: Category Jan Feb Mar
No ratings yet
Personal Financial Report: Category Jan Feb Mar
56 pages
Integers, Power and Roots A. Arithmatic Integers
No ratings yet
Integers, Power and Roots A. Arithmatic Integers
4 pages
Operation Research Lab Manual - Lab 03
No ratings yet
Operation Research Lab Manual - Lab 03
5 pages
QA Assignment 02
No ratings yet
QA Assignment 02
2 pages
20HCC22XX: B.Tech (III Sem)
No ratings yet
20HCC22XX: B.Tech (III Sem)
2 pages
RPP SPLDV Bab-5
No ratings yet
RPP SPLDV Bab-5
22 pages
Describe Θ (N*Logn) -Time Algorithm That, Given A Set S Of N Integers And Another Integer X, Determines Whether Or Not There Exist Two Elements In S Whose Sum Is Exactly X
No ratings yet
Describe Θ (N*Logn) -Time Algorithm That, Given A Set S Of N Integers And Another Integer X, Determines Whether Or Not There Exist Two Elements In S Whose Sum Is Exactly X
8 pages
Program 1
No ratings yet
Program 1
25 pages
421MA2176 Lab 5 and 6
No ratings yet
421MA2176 Lab 5 and 6
12 pages
Dictionary: Dict ('Name': 'Geeks', 1: (1, 2, 3, 4) )
No ratings yet
Dictionary: Dict ('Name': 'Geeks', 1: (1, 2, 3, 4) )
14 pages
An Improved Regula Falsi Method For Finding Simple Zeros of Nonlinear Equations
No ratings yet
An Improved Regula Falsi Method For Finding Simple Zeros of Nonlinear Equations
6 pages
Chapter 07 Deadlocks
No ratings yet
Chapter 07 Deadlocks
11 pages
ML Lab
No ratings yet
ML Lab
24 pages
Final Ppts Daa Unit III Dynamic Programming
No ratings yet
Final Ppts Daa Unit III Dynamic Programming
36 pages
Ex 1 A Numpy Ex
No ratings yet
Ex 1 A Numpy Ex
2 pages
Sigma Notation Area As A Limit
No ratings yet
Sigma Notation Area As A Limit
2 pages
Radix Sort - Wikipedia, The Free Encyclopedia
No ratings yet
Radix Sort - Wikipedia, The Free Encyclopedia
13 pages
NUMBER
No ratings yet
NUMBER
1 page
Codewriting Solutions Python
100% (4)
Codewriting Solutions Python
25 pages
Data Structures and Algorithms - 2018
No ratings yet
Data Structures and Algorithms - 2018
2 pages
Cambridge Lower Secondary Mathematics
No ratings yet
Cambridge Lower Secondary Mathematics
1 page
Assignment 1 & 2
No ratings yet
Assignment 1 & 2
2 pages
Daftar Pustaka
No ratings yet
Daftar Pustaka
1 page
Tutorial Discrete Maths
No ratings yet
Tutorial Discrete Maths
7 pages
Binary Search Algorithm
100% (1)
Binary Search Algorithm
12 pages
Web Mining DA
No ratings yet
Web Mining DA
13 pages
ML Lab Programs 1-10-Converted NAM COLLEGE PDF
No ratings yet
ML Lab Programs 1-10-Converted NAM COLLEGE PDF
33 pages
DVP 1
No ratings yet
DVP 1
24 pages
Task 5
No ratings yet
Task 5
3 pages
FDS All Practicals
No ratings yet
FDS All Practicals
10 pages
ML Lab Programs
No ratings yet
ML Lab Programs
21 pages
Machine Learning Through Python Lab Mannual
No ratings yet
Machine Learning Through Python Lab Mannual
33 pages
Machine Learning Lab Manual
No ratings yet
Machine Learning Lab Manual
26 pages
ML Lab Prog1-5 (5) College PDF
No ratings yet
ML Lab Prog1-5 (5) College PDF
12 pages
96 Yogesh Khairnar Assignment 4
No ratings yet
96 Yogesh Khairnar Assignment 4
25 pages
Chapter 5 EX
No ratings yet
Chapter 5 EX
10 pages
ML Lab Manual
No ratings yet
ML Lab Manual
90 pages
15CSL76 Students
No ratings yet
15CSL76 Students
18 pages
Col100 Assignment 2 - Computer Science Iitd Assignmets
No ratings yet
Col100 Assignment 2 - Computer Science Iitd Assignmets
6 pages
Mini Project
No ratings yet
Mini Project
7 pages
IR - 754 All Practical
No ratings yet
IR - 754 All Practical
21 pages
8.2.la Culpa Es de La Vaca 2 (Jaime Lopera)
No ratings yet
8.2.la Culpa Es de La Vaca 2 (Jaime Lopera)
407 pages
ML Lab Programs
No ratings yet
ML Lab Programs
15 pages
DVP 2
No ratings yet
DVP 2
10 pages
ML1 3 Merged
No ratings yet
ML1 3 Merged
19 pages
Dslall 13 Code
No ratings yet
Dslall 13 Code
92 pages
Answer Key AI
No ratings yet
Answer Key AI
23 pages
LPCC Assignment 5
No ratings yet
LPCC Assignment 5
8 pages
23 Final Solution
No ratings yet
23 Final Solution
7 pages
Dvpy Lab Exam
No ratings yet
Dvpy Lab Exam
13 pages
Program Imp
No ratings yet
Program Imp
5 pages
CLASS XII RECORD Computer
No ratings yet
CLASS XII RECORD Computer
14 pages
HW1
No ratings yet
HW1
2 pages
DWM Final Exps
No ratings yet
DWM Final Exps
14 pages
Deep Learning Lab Manual
No ratings yet
Deep Learning Lab Manual
46 pages
ML Lab Manual-99
No ratings yet
ML Lab Manual-99
23 pages
‎⁨ דף נוסחאות מדמח סופי⁩
No ratings yet
‎⁨ דף נוסחאות מדמח סופי⁩
2 pages
Module 2 Devide&Conquer
No ratings yet
Module 2 Devide&Conquer
48 pages
Unit 5 Binary Trees
No ratings yet
Unit 5 Binary Trees
28 pages
Python Alpn 10
No ratings yet
Python Alpn 10
20 pages
S4 - CNC Tsi 2020 - Youness 06 78 26 25 20
No ratings yet
S4 - CNC Tsi 2020 - Youness 06 78 26 25 20
5 pages
דף נוסחאות יסודות מדמח
No ratings yet
דף נוסחאות יסודות מדמח
4 pages
CNC2024 Corrigé
No ratings yet
CNC2024 Corrigé
3 pages
Lab3 202301445 CT
No ratings yet
Lab3 202301445 CT
12 pages
AIML Prograns
No ratings yet
AIML Prograns
6 pages
Python Programming
No ratings yet
Python Programming
15 pages
Rishabh Raj SCLD El Kmap
No ratings yet
Rishabh Raj SCLD El Kmap
16 pages
Python
No ratings yet
Python
4 pages
Ada Lab MANUAL Updated
No ratings yet
Ada Lab MANUAL Updated
30 pages
TP 4
No ratings yet
TP 4
3 pages
IR Prac 2
No ratings yet
IR Prac 2
4 pages
List of Experiments
No ratings yet
List of Experiments
2 pages
Lab 1 Python
No ratings yet
Lab 1 Python
5 pages
IR
No ratings yet
IR
12 pages
ML Lab Assignment2
No ratings yet
ML Lab Assignment2
9 pages
MATH Lab Final Code
No ratings yet
MATH Lab Final Code
10 pages
DC2 2023 Correction
No ratings yet
DC2 2023 Correction
4 pages
Wa0027.
No ratings yet
Wa0027.
34 pages
Untitled Document
No ratings yet
Untitled Document
15 pages
AIML Final Programs
No ratings yet
AIML Final Programs
8 pages
Codingan Fisika
No ratings yet
Codingan Fisika
11 pages
Ailmml
No ratings yet
Ailmml
1 page
ML Lab File Batch 1
No ratings yet
ML Lab File Batch 1
20 pages
Heuristic Search
No ratings yet
Heuristic Search
8 pages
Ai Lab
No ratings yet
Ai Lab
11 pages
Codes
No ratings yet
Codes
6 pages
Ex 2
No ratings yet
Ex 2
6 pages
Inverse Trigonometric Functions (Trigonometry) Mathematics Question Bank
From Everand
Inverse Trigonometric Functions (Trigonometry) Mathematics Question Bank
Mohmmad Khaja Shareef
No ratings yet
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet

Lampiran 1 Pseudocode COATES Algorithm Dengan Menggunakan Software Python

Uploaded by

Lampiran 1 Pseudocode COATES Algorithm Dengan Menggunakan Software Python

Uploaded by

Lampiran 1

Pseudocode COATES Algorithm dengan menggunakan Software Python

from nltk.tokenize import word_tokenize

def EuclidianDistance (centroid,TFIDF):

def CosineSimilarity (centroid,TFIDF):

print('3.Finding Term Frequency (TF)',end='')

print('4.Finding Document Fequency(DF)',end='')

print('5.Finding Inverse Document Frequency (IDF)',end='')

hold = input('Input any value to continue...')

print('1.Initialize Random Centroid',end='')

print('2.Compute Euclidian Distance',end='')

print('3.Assigned Document to Closest Centroid',end='')

print('1.Finding New Centroid')

print('2.Compute Euclidian Distance Document to New Centroid',end='')

print('3.Assigned Document to New Closest Centroid',end='')

print('2.Assign Document to Closest Cluster',end='')

print('3.Update Cluster Centroid Fisrt Minor Iteration')

hold = input('Input any value to continue...')

print('1.Compute Giny Index',end='')

print('2.Compute Average of Giny Index',end='')

print('3.Mark Attribute as Discrimanatory',end='')

print('4.Compute Probability of Discriminatory Attribute',end='')

print('5.Assigned Discriminatory Attribute to Cluster',end='')

print('6.Update Cluster Centroid')

Python 3.6.0 (v3.6.0:41df79263a11, Dec 23 2016, 07:18:10) [MSC v.1900 32 bit

Auxiliary Dictionary = Vector 1 x 2640

3.Finding Term Frequency (TF)...Done

4.Finding Document Fequency(DF)...Done

5.Finding Inverse Document Frequency (IDF)...Done

Anggota Cluster Tidak Berubah

CLUSTER 1 : Doc 32 Doc 50

Input any value to continue...

Doc 15 Move from Cluster 2 to Cluster 4

You might also like