twitools/markov.py
2017-02-24 00:14:23 +01:00

50 lines
1.6 KiB
Python
Executable file
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

#!/usr/bin/env python3
import dbtools, setuptools, twitools
import argparse, datetime, html, markovify, nltk, operator, os, random, re, string, sys, time
class Possy(markovify.NewlineText):
    """Newline-delimited Markov model whose tokens carry a part-of-speech tag.

    Each token produced by ``word_split`` is the word and whatever
    ``nltk.pos_tag`` paired it with, joined by ``"::"``.  ``word_join``
    removes that suffix again when a sentence is rendered.
    """

    _tag_sep = "::"

    def word_split(self, sentence):
        """Split *sentence* into ``word::tag`` tokens."""
        words = re.split(self.word_split_pattern, sentence)
        return [self._tag_sep.join(pair) for pair in nltk.pos_tag(words)]

    def word_join(self, words):
        """Join ``word::tag`` tokens back into a plain, space-separated sentence."""
        return " ".join(self._strip_tag(token) for token in words)

    @classmethod
    def _strip_tag(cls, token):
        """Return *token* without its trailing ``::tag`` suffix.

        Splitting at the *first* ``"::"`` truncates words that contain the
        separator themselves or end in a colon (``"Note:"`` tagged ``NN`` is
        ``"Note:::NN"``).  Instead, cut at the last separator that still
        leaves a non-empty tag behind it.
        Assumes tags are non-empty and never contain ``"::"`` -- TODO confirm
        against the tagger's tag set.
        """
        # Ignoring the final character guarantees at least one tag character
        # remains to the right of the separator that is found.
        cut = token[:-1].rfind(cls._tag_sep)
        return token if cut < 0 else token[:cut]
def sanitizeText(text):
    """Strip retweet prefixes and leading/trailing mentions from a tweet.

    Rules, applied recursively until none matches:

    * If the text starts with ``@`` (or has ``@`` as its second character)
      and the following word does not start with a lowercase ASCII letter,
      the first word is dropped.
    * If the last word starts with ``@`` it is dropped.
    * If the text starts with ``"RT @"`` everything up to and including the
      first ``":"`` is dropped.

    Args:
        text: The tweet text.

    Returns:
        The cleaned text, or ``""`` when the text is too short for the
        checks above (empty, whitespace-only, a single character, or a lone
        mention).
    """
    split = text.split()
    try:
        if text[0] == "@" or text[1] == "@":
            if split[1][0] not in string.ascii_lowercase:
                return sanitizeText(" ".join(split[1:]))
        if split[-1][0] == "@":
            return sanitizeText(" ".join(split[:-1]))
        if text[:4] == "RT @":
            return sanitizeText(text.partition(":")[2])
    except IndexError:
        # Only out-of-range indexing is expected here; anything else
        # (KeyboardInterrupt, programming errors) must not be swallowed.
        return ""
    return text
def getText(db=None):
    """Return the sanitized text of all stored tweets, one tweet per line.

    Args:
        db: Object providing ``executeQuery(sql)`` that yields rows whose
            first element is the tweet text.  When omitted, a
            ``dbtools.dbHelper()`` is created at call time (not at import
            time, so importing this module has no database side effect).

    Returns:
        The sanitized tweets joined by newlines, with blank lines removed
        and HTML entities unescaped.
    """
    if db is None:
        db = dbtools.dbHelper()
    rows = db.executeQuery('SELECT text FROM tweets;')
    combined = "".join(sanitizeText(row[0]) + "\n" for row in rows)
    # Tweets that sanitize to "" (or contain blank lines) leave empty lines
    # behind; drop them while keeping the original line endings.
    kept = [line for line in combined.strip().splitlines(True) if line.strip()]
    return html.unescape("".join(kept))
def markovifyText(text, max_chars=130, attempts=5):
    """Generate one short sentence from *text* with the ``Possy`` model.

    Args:
        text: Newline-separated corpus to build the model from.
        max_chars: Maximum length passed to ``make_short_sentence``.
        attempts: How many times to ask the model for a sentence before
            giving up.

    Returns:
        The generated sentence with every ``"@"`` followed by an invisible
        character.

    Raises:
        RuntimeError: If the model returned ``None`` on every attempt
            (previously this surfaced as an ``AttributeError`` on ``None``).
    """
    model = Possy(text)  # build once; only sentence generation is retried
    for _ in range(attempts):
        sentence = model.make_short_sentence(max_chars)
        if sentence is not None:
            # The replacement literal originally held a raw invisible
            # character, which made this line look like a no-op; it is
            # spelled as an escape so it survives editors and reviews.
            # NOTE(review): U+200B (zero width space) is assumed -- confirm
            # against the committed bytes.
            return sentence.replace("@", "@\u200b")
    raise RuntimeError(
        "could not generate a sentence of at most %d characters in %d attempts"
        % (max_chars, attempts)
    )
def getTime(now=None):
    """Return the seconds left until the quarter hour that follows *now*.

    The target is the next ``:00``, ``:15``, ``:30`` or ``:45`` strictly
    after the minute of *now*; the result is measured from the actual
    current time, not from *now*.

    Args:
        now: Reference ``datetime``; only its date, hour and minute are
            used.  Defaults to the current time, resolved on every call
            rather than once at import.

    Returns:
        Whole seconds to wait, never negative.  If the target already lies
        in the past, 0 is returned (``timedelta.seconds`` on a negative
        delta would instead yield almost a full day).
    """
    if now is None:
        now = datetime.datetime.now()
    # Built from the individual fields so the target is always naive, like
    # the datetime.now() it is compared with below.
    minute_start = datetime.datetime(now.year, now.month, now.day, now.hour, now.minute)
    # timedelta arithmetic handles the hour/day/month rollover.
    then = minute_start + datetime.timedelta(minutes=15 - now.minute % 15)
    remaining = (then - datetime.datetime.now()).total_seconds()
    return max(0, int(remaining))
if __name__ == "__main__":
    # Generate the sentence first, then wait for the number of seconds
    # reported by getTime() before posting it.
    generated = markovifyText(getText())
    delay = getTime()
    time.sleep(delay)
    twitools.tweet(generated, section = setuptools.MARKOV)