-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathWhatsAppChat.py
40 lines (37 loc) · 1.07 KB
/
WhatsAppChat.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
# -*- coding: utf-8 -*-
"""
Created on Sat Oct 17 06:27:01 2020
#Name: Chaeyoon Kim
#City Email: [email protected]
"""
# Read both inputs eagerly inside ``with`` blocks so the file handles are
# closed right away instead of staying open for the rest of the script.
# ``data`` and ``stop`` remain iterables of text lines, which is all that
# countWord() requires of them.
with open('WhatsAppChat.txt', 'r', encoding='utf-8', errors='ignore') as chat_file:
    data = chat_file.readlines()
with open('stopwords.txt', 'r') as stop_file:
    stop = stop_file.readlines()
def countWord(data, stop):
    """Count how often each word occurs in ``data``, leaving out stop words.

    Every whitespace-separated token is lower-cased and stripped of
    apostrophes before it is counted. Stop words are normalised the same
    way, so a stop-word entry such as ``don't`` also filters ``Dont``.

    Args:
        data: Iterable of text lines to analyse (an open text file or a
            list of strings both work).
        stop: Iterable of lines holding whitespace-separated stop words.

    Returns:
        A dict mapping each normalised, non-stop word to the number of
        times it occurs in ``data``.
    """
    def normalise(token):
        return token.lower().replace("'", "")

    # A set is enough: only membership matters for stop words.
    stop_words = {normalise(token) for line in stop for token in line.split()}

    wordDict = {}
    for line in data:
        for token in line.split():
            token = normalise(token)
            # Skip stop words entirely (previously they were stored with a
            # count of 1), and skip tokens that were nothing but apostrophes.
            if not token or token in stop_words:
                continue
            wordDict[token] = wordDict.get(token, 0) + 1
    return wordDict
# Build the word -> count table from the chat lines and the stop-word list.
wordDict = countWord(data, stop)
def printTop100(wordDict):
    """Print the most frequent words, highest count first.

    At most 100 entries are printed; when ``wordDict`` holds fewer words,
    all of them are printed. Each line has the form
    ``<rank> : <word> = <count>`` with ranks starting at 1. Words with equal
    counts keep the order in which they appear in ``wordDict``.

    Args:
        wordDict: Mapping of word -> occurrence count.

    Returns:
        None. The ranking is written to standard output only.
    """
    ranked = sorted(wordDict, key=wordDict.get, reverse=True)
    # Slicing (rather than range(100)) avoids an IndexError when fewer than
    # 100 distinct words are available.
    for rank, word in enumerate(ranked[:100], start=1):
        print(rank, ':', word, '=', wordDict[word])
#---------------------------------------------
# printTop100 writes the ranking itself and returns None, so its result is
# not printed again (doing so emitted a stray "None" line after the list).
printTop100(wordDict)