-
Notifications
You must be signed in to change notification settings - Fork 13
/
Copy pathmegbotex.py
148 lines (129 loc) · 4.74 KB
/
megbotex.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
#!/usr/bin/python
'''
Author: Megan Ruthven
Date: August 18, 2015
How to use the MegBot summary example:
python megbotex.py [facebook email] [facebook password] [messageID]
'''
import sys
import json
import re
import string
from collections import Counter
from nltk.corpus import stopwords
import time
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait # available since 2.4.0
from selenium.webdriver.support import expected_conditions as EC # available since 2.26.0
from selenium.common.exceptions import StaleElementReferenceException
from selenium.common.exceptions import TimeoutException
import requests
from splinter import Browser
from urllib2 import URLError
from megbot import MegBot
# Module-level configuration and start-up.
# Reads the Facebook credentials and the message ID from the command line,
# extends the NLTK English stop-word list with the 'addedStops' entries of
# config.json, and builds the MegBot instance used by the rest of the script.

# Upper bound on the number of chat messages gathered / summarised at once.
maxMessages = 50
# attempt to load stopwords
stop = stopwords.words('english')
# Character class matching any single ASCII punctuation character.
regex = re.compile('[%s]' % re.escape(string.punctuation))
# Prefix of every summary the bot posts; also used to recognise its own posts.
_intro = "Top words: "
# Text that requests a summary on demand.
_megbot_call = "@megbot"
# Marker that introduces a shout-out token.
_at_key = "@"
pattern = re.compile("\\b("+_intro+"|"+_megbot_call+")\\W", re.I)

# Only the argv look-ups can legitimately signal "wrong usage", so they are the
# only statements guarded by the IndexError handler. An IndexError raised while
# loading the config or constructing MegBot must not be reported as a usage
# error.
try:
    username = sys.argv[1]
    password = sys.argv[2]
    message = sys.argv[3]
except IndexError:
    print("Usage: python megbotex.py <facebook email> <facebook password> <message ID>")
    sys.exit()

# The file is only needed while parsing; close it before processing the data.
with open('config.json') as in_json:
    data = json.load(in_json)
print(data)

# Merge the user-supplied stop words (normalised to lower case, whitespace
# stripped) into the NLTK list and drop duplicates.
stop = list(set(stop + [word.lower().strip() for word in data['addedStops']]))

mb = MegBot(username, password)
print(stop)
def next_set(pastMessages):
    '''
    Collect chat messages that are not already known.

    Refreshes the conversation through the module-level MegBot instance (mb)
    and then reads it page by page. Messages containing the bot's own summary
    prefix (_intro) are skipped. Reading stops at the first message equal to
    one of the first four entries of pastMessages, or once at least
    maxMessages messages have been collected.

    pastMessages: list of message strings already seen (may be empty).
    Returns the list of newly collected messages, in the order they were read.
    '''
    collected = []
    mb.refresh_messages()
    if pastMessages:
        print("last line of past messages: " + pastMessages[0])
    # Only the first four known messages are used to detect the overlap.
    known = pastMessages[:4]

    while len(collected) < maxMessages:
        page = mb.read_messages()
        print(page)
        fresh = []
        reached_known = False
        for text in page:
            if _intro in text:
                # One of the bot's own summaries; never counted as chat.
                print("found my message")
                continue
            if text in known:
                print("was not an original message")
                print("but this was original" + ' '.join(fresh))
                reached_known = True
                break
            fresh.append(text)
        collected = collected + fresh
        if reached_known:
            print("returning now")
            return collected
        mb.next_page()
    return collected
def highest_words(mess):
    '''
    Return the most frequent words of a list of messages.

    The messages are joined, lower-cased, stripped of punctuation (module-level
    regex) and of every other non-alphanumeric run, and split into words.
    Words found in the module-level stop list are ignored.

    mess: list of message strings.
    Returns a string with up to five words, most frequent first, separated
    by ", ".
    '''
    lowered = ' '.join(mess).lower()
    without_punct = regex.sub('', lowered)
    cleaned = re.sub('[^0-9a-zA-Z]+', ' ', without_punct).strip()
    kept = [token for token in cleaned.split() if token not in stop]
    print(' '.join(kept))
    tally = Counter(kept)
    print(tally)
    top_five = tally.most_common(5)
    return ', '.join(word for word, _ in top_five)
# Main script: log in, post an initial summary of the conversation, then poll
# for new messages forever, posting a new summary when enough messages arrived
# or somebody wrote the @megbot call, and shouting out every other "@name".

#set up environment
mb.login()
mb.move_to_message(message)

#reading all of the past messages from the group chat
currCheck = next_set([])
# NOTE(review): the initial window keeps maxMessages-1 entries while the loop
# below keeps maxMessages; left as in the original - confirm which is intended.
currCheck = currCheck[:maxMessages-1]
print(currCheck)
ou = highest_words(currCheck)
print(ou)
mb.send_message(_intro + ou)

newMess = 0
filteredAts = []
while True:
    try:
        print("checking")
        #checking to see if the group message has gotten any more messages from before.
        n = next_set(currCheck)
        newMess = newMess + len(n)
        currCheck = n + currCheck
        print(newMess)
        print(currCheck)
        #if the max amount of messages or a @megbot call have come in, summarize the past maxMessages amount of chat and return the top 5 words.
        if newMess > maxMessages or any(_megbot_call in s for s in n):
            currCheck = currCheck[:maxMessages]
            ou = highest_words(currCheck)
            mb.send_message(_intro + ou)
            newMess = 0
            print("found another message")
        #shout out feature. If anyone says "@"xyz that isn't a megbot call. This shouts out the name following the @ in all capitals
        for f in ' '.join(currCheck[:len(n)]).split():
            # A bare "@" has no name after it; skip it instead of sending an
            # empty message.
            if f.startswith(_at_key) and len(f) > len(_at_key) and _megbot_call not in f:
                mb.send_message(f[len(_at_key):].upper())
        time.sleep(20)
    except (URLError, StaleElementReferenceException):
        # StaleElementReferenceException is imported by name at the top of the
        # file; the module name "selenium" itself is never bound, so spelling
        # out the dotted path here would raise NameError.
        print("reconnecting......")
        # Try to reconnect
        time.sleep(5)
        try:
            # Repeat the start-up sequence: log in again, then reopen the
            # conversation. Presumably a fresh login does not land on the
            # conversation page - verify against MegBot.
            mb.login()
            mb.move_to_message(message)
        except Exception as exc:
            # Best effort: report the failure and retry on the next pass.
            # Catching Exception (not a bare except) keeps Ctrl-C working.
            print("reconnect failed: " + str(exc))