-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmain.py
More file actions
97 lines (72 loc) · 2.7 KB
/
main.py
File metadata and controls
97 lines (72 loc) · 2.7 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
import argparse
import csv
import logging
import sys
from time import sleep
import scrape
import model
logger = logging.getLogger('mdq')
def load_messages():
    """Load previously saved messages from ``messages.csv``.

    The file is looked up relative to the current working directory and is
    parsed with the csv module's ``unix`` dialect.

    Returns:
        A list of rows, each row being the list of strings produced by
        ``csv.reader``. An empty list is returned when opening or reading
        the file raises ``OSError`` (for example when it does not exist yet).
    """
    try:
        # newline='' hands line-ending handling to the csv module, so line
        # breaks embedded in quoted fields are returned exactly as stored
        # instead of being rewritten by universal-newline translation.
        with open('messages.csv', 'r', newline='') as f:
            return list(csv.reader(f, dialect='unix'))
    except OSError:
        # Deliberate best effort: a missing/unreadable file means "no data".
        return []
def dump_messages(messages):
    """Write all messages to ``messages.csv``, replacing its previous contents.

    The file is created relative to the current working directory and is
    written with the csv module's ``unix`` dialect.

    Args:
        messages: Iterable of rows (each a sequence of fields) handed
            unchanged to ``csv.writer.writerows``.
    """
    # newline='' keeps the text layer from translating the line terminator
    # (and any newlines inside fields) to the platform's line separator;
    # the csv module documentation requires it for files given to a writer.
    with open('messages.csv', 'w', newline='') as f:
        csv.writer(f, dialect='unix').writerows(messages)
def clamp(i, min_, max_):
    """Restrict ``i`` to the range bounded below by ``min_`` and above by ``max_``.

    The upper bound is applied first and the lower bound second, so the
    lower bound wins if the two bounds are given in the wrong order.
    """
    # Apply the ceiling: keep i only when it is strictly below max_.
    capped = i if i < max_ else max_
    # Apply the floor: keep the capped value only when strictly above min_.
    return capped if capped > min_ else min_
def _build_parser():
    """Create the argument parser with the scrape, build-model and say actions."""
    parser = argparse.ArgumentParser()
    parser.add_argument('-v', '--verbose', action='count', default=0,
                        help='log more info. can be used twice')
    actions = parser.add_subparsers(title='action', dest='action')
    scrape_parser = actions.add_parser('scrape')
    scrape_parser.add_argument('-s', '--start-at-page', type=int, default=1)
    actions.add_parser('build-model')
    say_parser = actions.add_parser('say')
    say_parser.add_argument('-c', '--count', type=int, default=1)
    return parser


def _scrape(messages, start_at_page):
    """Append newly scraped (url, message) pairs to ``messages`` and save them.

    ``messages`` is extended in place. The first field of every existing row
    is passed to ``scrape.get_donation_urls`` as ``known``
    (NOTE(review): presumably so already-seen URLs are skipped - confirm in
    the scrape module).
    """
    known_urls = frozenset(message[0] for message in messages)
    try:
        for url in scrape.get_donation_urls(
                start_at_page=start_at_page, known=known_urls):
            message = scrape.get_message(url)
            logger.debug('url %s', url)
            logger.debug('message %s', message)
            if not message:
                continue
            messages.append((url, message))
            # Checkpoint only right after the list grew, so the file is not
            # rewritten again and again while the count sits on a multiple
            # of 25 and the following URLs yield no message.
            if len(messages) % 25 == 0:
                dump_messages(messages)
    except KeyboardInterrupt:
        logger.warning('Received interrupt. Stopping.')
    finally:
        # Persist whatever was collected on every exit path: normal
        # completion, Ctrl-C, or an unexpected error (which still propagates
        # after the save).
        dump_messages(messages)


def _build_model(messages):
    """Feed the second field of every row into a trigram chain and save it."""
    m = model.TrigramMarkovChain()
    for message in messages:
        m.ingest(message[1])
    m.save('model.pickle')


def _say(count):
    """Print ``count`` generated phrases, separated by a bullet line."""
    m = model.TrigramMarkovChain()
    try:
        m.load('model.pickle')
    except OSError:
        logger.error("Couldn't load model. Did you build the model first?")
        sys.exit(1)
    for i in range(count):
        if i > 0:
            print(' • • •')
        print(m.make_phrase())


def main():
    """Parse the command line, configure logging and run the chosen action.

    Exits with status 2 (after printing help) when no action is given, and
    with status 1 when the ``say`` action cannot load ``model.pickle``.
    """
    parser = _build_parser()
    args = parser.parse_args()

    # -v selects INFO, -vv (or more) selects DEBUG; the default is WARNING.
    loglevels = [logging.WARNING, logging.INFO, logging.DEBUG]
    logging.basicConfig(level=loglevels[clamp(args.verbose, 0, 2)])
    logger.debug(args)

    if args.action is None:
        parser.print_help()
        sys.exit(2)

    messages = load_messages()
    logger.info('Loaded %s donation messages from disk', len(messages))

    if args.action == 'scrape':
        _scrape(messages, args.start_at_page)
    elif args.action == 'build-model':
        _build_model(messages)
    elif args.action == 'say':
        _say(args.count)


if __name__ == '__main__':
    main()