twitools/markov.py

51 lines
1.6 KiB
Python
Raw Normal View History

2017-02-15 18:09:48 +00:00
#!/usr/bin/env python3
2017-02-18 19:55:06 +00:00
import dbtools, setuptools, twitools
import argparse, datetime, html, markovify, nltk, operator, os, random, re, string, sys, time
2017-02-15 18:09:48 +00:00
2017-02-15 21:19:20 +00:00
class Possy(markovify.NewlineText):
def word_split(self, sentence):
words = re.split(self.word_split_pattern, sentence)
words = [ "::".join(tag) for tag in nltk.pos_tag(words) ]
return words
def word_join(self, words):
sentence = " ".join(word.split("::")[0] for word in words)
return sentence
2017-02-15 18:09:48 +00:00
def sanitizeText(text):
2017-02-21 15:10:39 +00:00
split = text.split()
try:
2017-02-21 15:10:39 +00:00
if "@" in (text[0], text[1]):
if split[1][0] not in string.ascii_lowercase:
return sanitizeText(text.partition(" ")[2])
if split[-1][0] == "@":
return sanitizeText(" ".join(split[:-1]))
if text[:4] == "RT @":
return sanitizeText(text.partition(":")[2])
except:
return ""
return text
2017-02-15 18:09:48 +00:00
def getText(db = dbtools.dbHelper()):
2017-02-15 18:16:19 +00:00
text = ""
2017-02-21 15:10:39 +00:00
for string in db.executeQuery('SELECT text FROM tweets;'):
text += sanitizeText(string[0]) + "\n"
2017-02-16 11:21:25 +00:00
return html.unescape("".join([s for s in text.strip().splitlines(True) if s.strip()]))
2017-02-15 18:09:48 +00:00
2017-02-15 18:16:19 +00:00
def markovifyText(text):
2017-02-15 21:19:20 +00:00
return Possy(text).make_short_sentence(130).replace("@", "@")
2017-02-15 18:09:48 +00:00
def getTime(now = datetime.datetime.now()):
thenminute = 15 if now.minute < 15 else 30 if now.minute < 30 else 45 if now.minute < 45 else 0
thenhour = now.hour + 1 if thenminute == 0 else now.hour
then = datetime.datetime(now.year, now.month, now.day, thenhour, thenminute, 0)
return (then - now).seconds
2017-02-15 18:09:48 +00:00
if __name__ == "__main__":
2017-02-21 15:38:33 +00:00
os.nice(5)
2017-02-21 21:26:09 +00:00
text = markovifyText(getText())
time.sleep(getTime())
2017-02-21 21:26:09 +00:00
twitools.tweet(text, section = setuptools.MARKOV)