# Split Data
# Split the raw `groceries` text on newlines, then split every resulting line
# on commas, so `groceries_list` ends up holding one list of comma-separated
# fields per line.
# NOTE(review): `groceries` is created outside this excerpt — presumably a
# single str read from the data file; confirm.
groceries = groceries.split("\n")
groceries_list = []
for i in groceries:
    # The loop body has to be indented under the `for`; flush-left it is an
    # IndentationError and the script never starts.
    groceries_list.append(i.split(","))
# Tally how many times each entry of `all_groceries_list` occurs and keep the
# (item, count) pairs ordered by ascending count.
item_frequencies = sorted(
    Counter(all_groceries_list).items(),
    key=lambda pair: pair[1],
)
# barplot of top 10
import matplotlib.pyplot as plt
# NOTE(review): `groceries_series` is built outside this excerpt — presumably
# a one-column DataFrame whose cells are lists of item names; confirm.
groceries_series.columns = ["transactions"]
# Create a dummy (indicator) column for each item in each transaction, using
# the item names as column names.
# Each row's items are first joined into one '*'-delimited string, then
# get_dummies splits on '*' again to produce one column per distinct item.
# This assumes no item name contains '*'.
X = groceries_series['transactions'].str.join(sep = '*').str.get_dummies(sep = '*')
# Sort the contents of every element of `ma_X` — presumably so that the same
# items listed in a different order become identical lists; confirm.
# NOTE(review): `ma_X` and `unique_rules_sets` are defined outside this
# excerpt; `ma_X` is assumed to be a pandas Series of iterables.
ma_X = ma_X.apply(sorted)
rules_sets = list(ma_X)
# For each entry of `unique_rules_sets`, record the position of its first
# occurrence in `rules_sets` (list.index returns the first match and raises
# ValueError when there is none).
index_rules = []
for i in unique_rules_sets:
    # The loop body has to be indented under the `for`; flush-left it is an
    # IndentationError.
    index_rules.append(rules_sets.index(i))
# Print the result of splitting `text` with the default separator.
# NOTE(review): `text` is defined outside this excerpt — presumably a str, in
# which case this prints its whitespace-separated tokens; confirm.
print(text.split())
# Install the arules package (needs to run only once per R installation).
# NOTE(review): no library(arules) call is visible in this excerpt — confirm
# the package is attached before the calls below.
install.packages("arules")
# NOTE(review): `movie` is created outside this excerpt — presumably an arules
# transactions object; confirm.
# Display elements 1 through 10 of `movie`.
inspect(movie[1:10])
# Report the class of `movie`.
class(movie)
# Print a summary of `movie`.
summary(movie)
# making rules using apriori algorithm
# NOTE(review): the call that actually builds `arules` is not visible in this
# excerpt — confirm it runs before the line below.
# Show the first rows of the quality measures attached to `arules`.
head(quality(arules))
# Open a new graphics device for the plots below.
# dev.new() replaces windows() because windows() is only defined on Windows
# builds of R, whereas dev.new() opens the platform's default device.
dev.new()
# NOTE(review): the "grouped" and "graph" plot methods for rules presumably
# come from the arulesViz package — confirm it is loaded.
plot(arules, method = "grouped")
plot(arules[1:10], method = "graph") # for good visualization try plotting only few rules
# Write `arules` to the file a_rules.csv using a comma as the separator.
write(arules, file = "a_rules.csv", sep = ",")
# Print the current working directory — presumably to show where the relative
# path above was written; confirm.
getwd()