2016-04-07 22:15:21 +00:00
|
|
|
import configparser, csv, datetime, html.parser, itertools, os, sqlite3, sys, tweepy
|
2015-10-10 22:10:57 +00:00
|
|
|
|
|
|
|
class SetupException(Exception):
|
|
|
|
def __str__(self):
|
|
|
|
return "Seems like config.cfg has not been created yet. Run setup.py to do so."
|
|
|
|
|
|
|
|
|
|
|
|
def getSetting(section, setting):
|
|
|
|
config = configparser.RawConfigParser()
|
|
|
|
config.read('config.cfg')
|
|
|
|
return config.get(section, setting)
|
|
|
|
|
|
|
|
def dbpath():
|
|
|
|
try:
|
|
|
|
return getSetting("Database", "path")
|
|
|
|
except:
|
|
|
|
return "Database.db"
|
|
|
|
|
|
|
|
def cke():
|
|
|
|
try:
|
|
|
|
return getSetting("Twitter", "cke")
|
|
|
|
except:
|
2016-02-08 00:55:12 +00:00
|
|
|
raise SetupException()
|
2015-10-10 22:10:57 +00:00
|
|
|
|
|
|
|
def cse():
|
|
|
|
try:
|
|
|
|
return getSetting("Twitter", "cse")
|
|
|
|
except:
|
2016-02-08 00:55:12 +00:00
|
|
|
raise SetupException()
|
2015-10-10 22:10:57 +00:00
|
|
|
|
|
|
|
def ato():
|
|
|
|
try:
|
|
|
|
return getSetting("Twitter", "ato")
|
|
|
|
except:
|
|
|
|
raise SetupException()
|
|
|
|
|
|
|
|
def ase():
|
|
|
|
try:
|
2016-02-08 00:55:12 +00:00
|
|
|
return getSetting("Twitter", "ase")
|
2015-10-10 22:10:57 +00:00
|
|
|
except:
|
|
|
|
raise SetupException()
|
|
|
|
|
|
|
|
def user():
|
2016-02-08 00:55:12 +00:00
|
|
|
return twObject().whoami()
|
2015-04-21 21:07:25 +00:00
|
|
|
|
|
|
|
|
|
|
|
class dbObject:
|
|
|
|
|
2015-10-10 22:10:57 +00:00
|
|
|
def __init__(self, path=dbpath()):
|
2015-04-21 21:07:25 +00:00
|
|
|
self.conn = sqlite3.connect(path)
|
|
|
|
self.cur = self.conn.cursor()
|
2015-04-22 00:06:32 +00:00
|
|
|
self.path = path
|
2015-04-21 21:07:25 +00:00
|
|
|
|
|
|
|
def closeConnection(self):
|
|
|
|
return self.conn.close()
|
|
|
|
|
|
|
|
def commit(self):
|
|
|
|
return self.conn.commit()
|
|
|
|
|
|
|
|
def executeQuery(self, query):
|
2015-04-28 08:39:30 +00:00
|
|
|
return self.cur.execute(query)
|
2015-04-21 21:07:25 +00:00
|
|
|
|
2015-04-22 00:06:32 +00:00
|
|
|
def getNext(self):
|
|
|
|
return self.cur.fetchone()
|
2015-04-21 21:07:25 +00:00
|
|
|
|
2015-04-21 22:16:42 +00:00
|
|
|
def isInitialized(self):
|
|
|
|
try:
|
|
|
|
self.executeQuery("SELECT * FROM tweets")
|
|
|
|
return True
|
|
|
|
except:
|
|
|
|
return False
|
|
|
|
|
2015-05-14 14:29:55 +00:00
|
|
|
def getFLDate(self, val = 0):
|
|
|
|
if val == 0:
|
|
|
|
mode = "MIN"
|
|
|
|
else:
|
|
|
|
mode = "MAX"
|
|
|
|
|
|
|
|
return getDate(str(list(self.executeQuery("SELECT %s(SUBSTR(timestamp,0,11)) FROM tweets" % mode))[0][0]))
|
|
|
|
|
2015-04-21 22:16:42 +00:00
|
|
|
|
2015-04-22 00:06:32 +00:00
|
|
|
class twObject:
|
|
|
|
|
2015-10-10 22:10:57 +00:00
|
|
|
def __init__(self, cke = cke(), cse = cse(), ato = ato(), ase = ase()):
|
|
|
|
self.auth = tweepy.OAuthHandler(cke, cse)
|
|
|
|
self.auth.set_access_token(ato, ase)
|
2015-04-22 00:06:32 +00:00
|
|
|
self.api = tweepy.API(self.auth)
|
|
|
|
|
2015-10-10 19:15:26 +00:00
|
|
|
def delete(self, id):
|
|
|
|
self.api.destroy_status(id)
|
|
|
|
|
2015-04-22 00:06:32 +00:00
|
|
|
def search(self, query, savepoint = 0):
|
|
|
|
tweets = list(tweepy.Cursor(self.api.search, q=query, since_id=savepoint).items())
|
|
|
|
tweets.reverse()
|
|
|
|
return tweets
|
|
|
|
|
2015-10-10 22:10:57 +00:00
|
|
|
def whoami(self):
|
2016-02-08 00:55:12 +00:00
|
|
|
return self.auth.get_username()
|
2015-10-10 22:10:57 +00:00
|
|
|
|
2015-04-22 00:06:32 +00:00
|
|
|
|
2015-04-21 22:42:20 +00:00
|
|
|
def dbCheck(db, create = False):
|
2015-04-22 00:06:32 +00:00
|
|
|
if (not create and dbInitialized(db)) or (create and not dbInitialized(db)):
|
2015-04-21 22:16:42 +00:00
|
|
|
return True
|
2015-04-21 22:42:20 +00:00
|
|
|
if create:
|
2015-04-22 00:06:32 +00:00
|
|
|
raise ValueError("Provided database file " + db.path + " is already initialized. Remove it manually before trying to recreate it.")
|
|
|
|
raise ValueError("Provided database file " + db.path + " is not initialized. Create it using makedb.py or csvdb.py")
|
2015-04-21 22:16:42 +00:00
|
|
|
|
|
|
|
|
2015-04-21 22:42:20 +00:00
|
|
|
def dbHelper(path, create = False):
|
2015-04-21 22:21:16 +00:00
|
|
|
db = dbObject(path)
|
2015-04-21 22:42:20 +00:00
|
|
|
dbCheck(db, create)
|
2015-04-21 22:21:16 +00:00
|
|
|
return db
|
2015-04-21 22:16:42 +00:00
|
|
|
|
|
|
|
|
2015-04-21 22:21:16 +00:00
|
|
|
def dbInitialized(db):
|
2015-04-21 22:16:42 +00:00
|
|
|
return db.isInitialized()
|
|
|
|
|
2015-04-21 21:07:25 +00:00
|
|
|
|
|
|
|
def fileExists(path):
|
|
|
|
return os.path.isfile(path)
|
|
|
|
|
2015-04-21 22:16:42 +00:00
|
|
|
|
2015-05-14 14:29:55 +00:00
|
|
|
def getDate(date):
|
|
|
|
try:
|
|
|
|
return datetime.datetime.strptime(date, '%Y-%m-%d')
|
|
|
|
except ValueError:
|
|
|
|
raise ValueError("Dates must be in YYYY-MM-DD format.")
|
|
|
|
|
|
|
|
|
2015-05-17 19:33:25 +00:00
|
|
|
def paginate(iterable, page_size):
|
|
|
|
while True:
|
|
|
|
i1, i2 = itertools.tee(iterable)
|
|
|
|
iterable, page = (itertools.islice(i1, page_size, None), list(itertools.islice(i2, page_size)))
|
|
|
|
if len(page) == 0:
|
|
|
|
break
|
|
|
|
yield page
|
|
|
|
|
|
|
|
|
2015-04-21 22:16:42 +00:00
|
|
|
def parseArgs(argv):
|
|
|
|
args = []
|
|
|
|
path = None
|
|
|
|
nextpath = False
|
|
|
|
|
|
|
|
for a in argv[1:]:
|
|
|
|
if nextpath:
|
|
|
|
path = a
|
|
|
|
nextpath = False
|
|
|
|
elif a == "-f":
|
|
|
|
if path != None:
|
|
|
|
raise ValueError("You can only pass one database file.")
|
|
|
|
nextpath = True
|
|
|
|
else:
|
|
|
|
args += [a]
|
|
|
|
|
|
|
|
return args, path
|
2015-04-24 21:33:42 +00:00
|
|
|
|
|
|
|
def printCSV(inlist):
|
|
|
|
writer = csv.writer(sys.stdout)
|
|
|
|
writer.writerows(inlist)
|
|
|
|
|
2016-04-07 22:15:21 +00:00
|
|
|
def unescapeText(text):
|
|
|
|
return html.parser.HTMLParser().unescape(text).replace("'","''")
|
|
|
|
|