AgathaSorceress-mstdn-ebooks/main.py

#!/usr/bin/env python3
# toot downloader version two!!
# This Source Code Form is subject to the terms of the Mozilla Public
# License, v. 2.0. If a copy of the MPL was not distributed with this
# file, You can obtain one at http://mozilla.org/MPL/2.0/.

from mastodon import Mastodon
from os import path
from bs4 import BeautifulSoup
import os, sqlite3, signal, sys, json, re, shutil, argparse
import requests
import functions

# Command-line interface: the only option is the location of the JSON config file.
parser = argparse.ArgumentParser(description='Log in and download posts.')
# nargs='?' allows "-c" to be given without a value. Without const, argparse would
# store None in that case and opening the config file would crash; const makes a
# bare "-c" fall back to the same path as the default.
parser.add_argument('-c', '--cfg', dest='cfg', default='config.json', const='config.json', nargs='?',
	help="Specify a custom location for config.json.")

args = parser.parse_args()

# OAuth scopes passed to Mastodon.create_app, auth_request_url and log_in below.
scopes = [
	"read:statuses",
	"read:accounts",
	"read:follows",
	"write:statuses",
	"read:notifications",
	"write:accounts",
]

# Default settings. Values loaded from the config file are merged over these,
# and the merged result is written back to that file further down.
cfg = dict(
	site="https://botsin.space",
	cw=None,
	instance_blacklist=["bofa.lol", "witches.town", "knzk.me"],  # accounts on these hosts are skipped
	learn_from_cw=False,
	mention_handling=1,
	max_thread_length=15,
	strip_paired_punctuation=False,
)

# Merge the user's config file over the defaults. If the file does not exist yet,
# create it containing an empty JSON object so later runs find a valid file.
# Context managers make sure both handles are closed (and the write is flushed).
try:
	with open(args.cfg, 'r') as cfg_file:
		cfg.update(json.load(cfg_file))
except FileNotFoundError:
	with open(args.cfg, "w") as cfg_file:
		cfg_file.write("{}")

print("Using {} as configuration file".format(args.cfg))

# Register this program as an application on the instance if no app
# credentials are stored in the config yet.
if "client" not in cfg:
	print("No application info -- registering application with {}".format(cfg['site']))
	client_id, client_secret = Mastodon.create_app("mstdn-ebooks",
		api_base_url=cfg['site'],
		scopes=scopes,
		website="https://github.com/Lynnesbian/mstdn-ebooks")

	cfg['client'] = {
		"id": client_id,
		"secret": client_secret
	}

# Interactive login if no user credential is stored: the user opens the
# authorisation URL, then pastes the code shown there at the prompt.
if "secret" not in cfg:
	print("No user credentials -- logging in to {}".format(cfg['site']))
	client = Mastodon(client_id = cfg['client']['id'],
		client_secret = cfg['client']['secret'],
		api_base_url=cfg['site'])

	print("Open this URL and authenticate to give mstdn-ebooks access to your bot's account: {}".format(client.auth_request_url(scopes=scopes)))
	cfg['secret'] = client.log_in(code=input("Secret: "), scopes=scopes)

# Persist the merged config (defaults + file contents + any new credentials).
# The with-block guarantees the file is flushed and closed before we continue.
with open(args.cfg, "w+") as cfg_file:
	json.dump(cfg, cfg_file)

def extract_toot(toot):
	"""Clean a post with functions.extract_toot, then defuse any mentions in it.

	A zero-width space (U+200B) is inserted after every "@" so that the
	resulting text does not mention the users it names.
	"""
	cleaned = functions.extract_toot(toot)
	return cleaned.replace("@", "@\u200B")

# Authenticated API client for the bot account.
client = Mastodon(
	client_id=cfg['client']['id'],
	client_secret = cfg['client']['secret'],
	access_token=cfg['secret'],
	api_base_url=cfg['site'])

me = client.account_verify_credentials()
# account_following() is paginated and returns only the first page of results;
# fetch_remaining() follows the pagination links so that every followed account
# is processed, not just the first page's worth.
following = client.fetch_remaining(client.account_following(me.id))

# Open (or create) the post database in the current working directory.
db = sqlite3.connect("toots.db")
db.text_factory=str
c = db.cursor()
# sortid must carry a DEFAULT: insert_toot() does not supply a value for it, and
# SQLite aborts a REPLACE that would leave a NOT NULL column without a default
# as NULL -- which would make every insert fail.
# NOTE(review): with a constant default sortid carries no ordering information;
# confirm what the consumers of this column expect.
c.execute("CREATE TABLE IF NOT EXISTS `toots` (sortid INT NOT NULL DEFAULT 0, id VARCHAR NOT NULL UNIQUE PRIMARY KEY, cw INT NOT NULL DEFAULT 0, userid VARCHAR NOT NULL, uri VARCHAR NOT NULL, content VARCHAR NOT NULL) WITHOUT ROWID")
# Migrate databases created before the sortid column existed. SQLite refuses to
# add a NOT NULL column without a non-NULL default, so the default is required
# here too. Checking the column list first avoids swallowing unrelated errors.
existing_columns = {row[1] for row in c.execute("PRAGMA table_info(`toots`)")}
if "sortid" not in existing_columns:
	c.execute("ALTER TABLE `toots` ADD COLUMN sortid INT NOT NULL DEFAULT 0")
db.commit()

def handleCtrlC(signal, frame):
	"""SIGINT handler: commit whatever has been written so far, then exit with status 1.

	Both arguments are the ones the signal machinery passes to a handler and
	are not used here.
	"""
	print("\nPREMATURE EVACUATION - Saving chunks")
	db.commit()
	raise SystemExit(1)

# Route Ctrl-C through the handler above so an interrupted run keeps its downloaded posts.
signal.signal(signal.SIGINT, handleCtrlC)

# Regexes compiled once here because they are used for every followed account / post.
patterns = {
	# domain part of an "user@domain" handle (group 1); no match for local handles
	"handle": re.compile(r"^.*@(.+)"),
	# host (and port, if any) of an http(s) URL (group 1). Stops at the first
	# "/", "?" or "#" so a trailing slash or path in the configured site URL
	# does not end up in the host name.
	"url": re.compile(r"https?://([^/?#]+)"),
	# value of a template="..." attribute (group 1), as found in host-meta documents
	"uri": re.compile(r'template="([^"]+)"'),
	# last path segment of a URI (group 0)
	"pid": re.compile(r"[^\/]+$"),
}


def insert_toot(oii, acc, post, cursor):  # extracted to prevent duplication
	"""Store one post in the `toots` table, replacing any existing row with the same id.

	oii    -- activity dict; oii['object']['id'] is required, oii['object']['summary'] is optional
	acc    -- account object whose .id is stored in the userid column
	post   -- post text stored in the content column
	cursor -- database cursor the REPLACE statement is executed on

	Raises KeyError if the activity has no object id, and AttributeError if
	that id has no trailing path segment to use as the row id.

	NOTE: sortid is not set here, so the table schema must provide a default for it.
	"""
	obj = oii['object']
	# the row id is the last path segment of the object's URI
	pid = patterns["pid"].search(obj['id']).group(0)
	# A missing "summary" key is treated like a null or empty one (no content
	# warning) instead of raising KeyError, which would make the caller drop the post.
	has_cw = obj.get('summary') not in (None, "")
	cursor.execute("REPLACE INTO toots (id, cw, userid, uri, content) VALUES (?, ?, ?, ?, ?)", (
		pid,
		1 if has_cw else 0,
		acc.id,
		obj['id'],
		post
	))


# Download new posts for every followed account through its public ActivityPub
# outbox, then compact and close the database.
for f in following:
	# Newest stored post id for this account; 0 means nothing has been stored yet.
	last_toot = c.execute("SELECT id FROM `toots` WHERE userid LIKE ? ORDER BY id DESC LIMIT 1", (f.id,)).fetchone()
	last_toot = last_toot[0] if last_toot is not None else 0
	print("Downloading posts for user @{}, starting from {}".format(f.acct, last_toot))

	#find the user's activitypub outbox
	print("WebFingering...")
	instance = patterns["handle"].search(f.acct)
	if instance is None:
		# acct has no "@domain" part, so the account lives on our own instance
		instance = patterns["url"].search(cfg['site']).group(1)
	else:
		instance = instance.group(1)

	if instance in cfg['instance_blacklist']:
		print("skipping blacklisted instance: {}".format(instance))
		continue

	# "except Exception" rather than a bare except, here and below: the Ctrl-C
	# handler exits by raising SystemExit, which a bare except would swallow.
	try:
		# 1. download host-meta to find webfinger URL
		r = requests.get("https://{}/.well-known/host-meta".format(instance), timeout=10)
		# 2. use webfinger to find user's info page
		uri = patterns["uri"].search(r.text).group(1)
		uri = uri.format(uri = "{}@{}".format(f.username, instance))
		r = requests.get(uri, headers={"Accept": "application/json"}, timeout=10)
		j = r.json()
		found = False
		for link in j['links']:
			if link['rel'] == 'self':
				#this is a link formatted like "https://instan.ce/users/username", which is what we need
				uri = link['href']
				found = True
				break
		if not found:
			print("Couldn't find a valid ActivityPub outbox URL.")
			# uri still holds the webfinger URL here, so there is no outbox to
			# query for this account; move on to the next one.
			continue

		# 3. download first page of outbox
		uri = "{}/outbox?page=true".format(uri)
		r = requests.get(uri, timeout=15)
		j = r.json()
	except Exception:
		print("oopsy woopsy!! we made a fucky wucky!!!\n(we're probably rate limited, please hang up and try again)")
		sys.exit(1)

	skipped = 0 # posts of this account that could not be parsed or stored
	try:
		# A first page without a "next" link is handled in Pleroma compatibility
		# mode: walk from the "first" page via "next" until a stored post is seen.
		# Otherwise restart from the newest stored id and walk via "prev".
		pleroma = 'next' not in j
		if pleroma:
			print("Using Pleroma compatibility mode")
			j = j['first']
		else:
			print("Using standard mode")
			uri = "{}&min_id={}".format(uri, last_toot)
			r = requests.get(uri, timeout=15)
			r.raise_for_status() # surfaces 429 and other HTTP errors to the handlers below
			j = r.json()

		print("Downloading and saving posts", end='', flush=True)
		done = False
		while not done and len(j['orderedItems']) > 0:
			for oi in j['orderedItems']:
				if oi['type'] != "Create":
					continue #this isn't a toot/post/status/whatever, it's a boost or a follow or some other activitypub thing. ignore

				try:
					toot = extract_toot(oi['object']['content'])
					if pleroma and c.execute("SELECT COUNT(*) FROM toots WHERE uri LIKE ?", (oi['object']['id'],)).fetchone()[0] > 0:
						#we've caught up to the notices we've already downloaded, so we can stop now
						#known limitation: if the server stops serving pages before we get here,
						#the posts in between are never fetched
						done = True
					if 'lang' in cfg:
						# filter for language: posts without a contentMap are always kept,
						# posts with one are kept only if it has a non-empty entry for
						# the configured language
						content_map = oi['object'].get('contentMap')
						if content_map is None or content_map.get(cfg['lang']):
							insert_toot(oi, f, toot, c)
					else:
						insert_toot(oi, f, toot, c)
				except Exception:
					# a single bad post must not abort the whole account; count it
					# so the failure is at least reported below
					skipped += 1

			# get the next/previous page
			page_key = 'next' if pleroma else 'prev'
			if page_key not in j:
				break # no further page advertised
			try:
				r = requests.get(j[page_key], timeout=15)
			except requests.Timeout:
				print("HTTP timeout, site did not respond within 15 seconds")
				break # r still holds the previous page; re-parsing it would loop forever
			except requests.RequestException:
				print("An error occurred while trying to obtain more posts.")
				break

			r.raise_for_status()
			j = r.json()
			print('.', end='', flush=True)
		print(" Done!")
	except requests.HTTPError as e:
		if e.response is not None and e.response.status_code == 429:
			print("Rate limit exceeded. This means we're downloading too many posts in quick succession. Saving toots to database and moving to next followed account.")
		else:
			print("Encountered an error! Saving posts to database and moving to next followed account.")
	except Exception:
		print("Encountered an error! Saving posts to database and moving to next followed account.")
	finally:
		if skipped:
			print("{} post(s) could not be saved and were skipped.".format(skipped))
		# keep whatever was stored for this account, whether or not an error occurred
		db.commit()

print("Done!")

db.commit()
db.execute("VACUUM") #compact db
db.commit()
db.close()
initial commit 2018-10-09 03:11:51 +02:00			`#!/usr/bin/env python3`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`# toot downloader version two!!`
initial commit 2018-10-09 03:11:51 +02:00			`# This Source Code Form is subject to the terms of the Mozilla Public`
			`# License, v. 2.0. If a copy of the MPL was not distributed with this`
			`# file, You can obtain one at http://mozilla.org/MPL/2.0/.`

			`from mastodon import Mastodon`
			`from os import path`
			`from bs4 import BeautifulSoup`
allow users to specify custom config.json location 2019-08-07 05:46:57 +02:00			`import os, sqlite3, signal, sys, json, re, shutil, argparse`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`import requests`
main.py now uses functions.py's extract_toot func 2019-01-11 13:58:17 +01:00			`import functions`
initial commit 2018-10-09 03:11:51 +02:00
allow users to specify custom config.json location 2019-08-07 05:46:57 +02:00			`parser = argparse.ArgumentParser(description='Log in and download posts.')`
fix silly mistake 2019-08-07 05:48:45 +02:00			`parser.add_argument('-c', '--cfg', dest='cfg', default='config.json', nargs='?',`
allow users to specify custom config.json location 2019-08-07 05:46:57 +02:00			`help="Specify a custom location for config.json.")`

			`args = parser.parse_args()`

Added the ability to pin and unpin toots with the pin and unpin command. Would like to clean up code as well as possibly toot confirmation and error messages 2019-05-19 14:31:42 +02:00			`scopes = ["read:statuses", "read:accounts", "read:follows", "write:statuses", "read:notifications", "write:accounts"]`
handle cfg defaults better 2019-04-29 05:59:37 +02:00			`#cfg defaults`
Added the ability to pin and unpin toots with the pin and unpin command. Would like to clean up code as well as possibly toot confirmation and error messages 2019-05-19 14:31:42 +02:00
handle cfg defaults better 2019-04-29 05:59:37 +02:00			`cfg = {`
			`"site": "https://botsin.space",`
			`"cw": None,`
allow users to specify custom config.json location 2019-08-07 05:46:57 +02:00			`"instance_blacklist": ["bofa.lol", "witches.town", "knzk.me"], # rest in piece`
mention_handling defaults to 1 2019-04-29 06:24:52 +02:00			`"learn_from_cw": False,`
			`"mention_handling": 1,`
added documentation and default value for as of yet unimplemented paired punctuation stripping functionality (#25) 2019-07-01 09:19:52 +02:00			`"max_thread_length": 15,`
			`"strip_paired_punctuation": False`
handle cfg defaults better 2019-04-29 05:59:37 +02:00			`}`
Added the ability to pin and unpin toots with the pin and unpin command. Would like to clean up code as well as possibly toot confirmation and error messages 2019-05-19 14:31:42 +02:00
create config if it doesn't exist 2019-08-14 07:00:35 +02:00			`try:`
			`cfg.update(json.load(open(args.cfg, 'r')))`
			`except FileNotFoundError:`
			`open(args.cfg, "w").write("{}")`
allow users to specify custom config.json location 2019-08-07 05:46:57 +02:00
			`print("Using {} as configuration file".format(args.cfg))`
better commenting, handle missing config.json fields 2019-01-11 13:05:29 +01:00
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`if "client" not in cfg:`
easier to understand logging 2019-01-11 13:08:10 +01:00			`print("No application info -- registering application with {}".format(cfg['site']))`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`client_id, client_secret = Mastodon.create_app("mstdn-ebooks",`
			`api_base_url=cfg['site'],`
			`scopes=scopes,`
			`website="https://github.com/Lynnesbian/mstdn-ebooks")`

			`cfg['client'] = {`
			`"id": client_id,`
			`"secret": client_secret`
			`}`

			`if "secret" not in cfg:`
easier to understand logging 2019-01-11 13:08:10 +01:00			`print("No user credentials -- logging in to {}".format(cfg['site']))`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`client = Mastodon(client_id = cfg['client']['id'],`
			`client_secret = cfg['client']['secret'],`
			`api_base_url=cfg['site'])`
initial commit 2018-10-09 03:11:51 +02:00
easier to understand logging 2019-01-11 13:08:10 +01:00			`print("Open this URL and authenticate to give mstdn-ebooks access to your bot's account: {}".format(client.auth_request_url(scopes=scopes)))`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`cfg['secret'] = client.log_in(code=input("Secret: "), scopes=scopes)`
initial commit 2018-10-09 03:11:51 +02:00
allow users to specify custom config.json location 2019-08-07 05:46:57 +02:00			`json.dump(cfg, open(args.cfg, "w+"))`
initial commit 2018-10-09 03:11:51 +02:00
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`def extract_toot(toot):`
main.py now uses functions.py's extract_toot func 2019-01-11 13:58:17 +01:00			`toot = functions.extract_toot(toot)`
actually use ZWS instead of RLE 2018-11-27 12:29:50 +01:00			`toot = toot.replace("@", "@\u200B") #put a zws between @ and username to avoid mentioning`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`return(toot)`
initial commit 2018-10-09 03:11:51 +02:00
			`client = Mastodon(`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`client_id=cfg['client']['id'],`
add config option to filter for language 2019-02-25 19:30:40 +01:00			`client_secret = cfg['client']['secret'],`
			`access_token=cfg['secret'],`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`api_base_url=cfg['site'])`
initial commit 2018-10-09 03:11:51 +02:00
			`me = client.account_verify_credentials()`
			`following = client.account_following(me.id)`

			`db = sqlite3.connect("toots.db")`
			`db.text_factory=str`
			`c = db.cursor()`
add sort id if it doesn't exist 2019-08-14 07:10:53 +02:00			c.execute("CREATE TABLE IF NOT EXISTS `toots` (sortid INT NOT NULL, id VARCHAR NOT NULL UNIQUE PRIMARY KEY, cw INT NOT NULL DEFAULT 0, userid VARCHAR NOT NULL, uri VARCHAR NOT NULL, content VARCHAR NOT NULL) WITHOUT ROWID")
added support for learning from CW'd posts 2019-02-25 02:17:06 +01:00			`try:`
add sort id if it doesn't exist 2019-08-14 07:10:53 +02:00			c.execute("ALTER TABLE `toots` ADD COLUMN sortid INT NOT NULL")
added support for learning from CW'd posts 2019-02-25 02:17:06 +01:00			`except:`
			`pass # column already exists`
initial commit 2018-10-09 03:11:51 +02:00			`db.commit()`

			`def handleCtrlC(signal, frame):`
			`print("\nPREMATURE EVACUATION - Saving chunks")`
			`db.commit()`
			`sys.exit(1)`

			`signal.signal(signal.SIGINT, handleCtrlC)`

precompiled regexes used inside of loop 2019-02-07 16:27:52 +01:00			`patterns = {`
fixed tabs i think hopefully 2019-02-07 16:45:44 +01:00			`"handle": re.compile(r"^.*@(.+)"),`
			`"url": re.compile(r"https?:\/\/(.*)"),`
			`"uri": re.compile(r'template="([^"]+)"'),`
			`"pid": re.compile(r"[^\/]+$"),`
precompiled regexes used inside of loop 2019-02-07 16:27:52 +01:00			`}`
fix for pleroma 2018-10-27 10:28:20 +02:00
add config option to filter for language 2019-02-25 19:30:40 +01:00
			`def insert_toot(oii, acc, post, cursor): # extracted to prevent duplication`
			`pid = patterns["pid"].search(oii['object']['id']).group(0)`
			`cursor.execute("REPLACE INTO toots (id, cw, userid, uri, content) VALUES (?, ?, ?, ?, ?)", (`
			`pid,`
			`1 if (oii['object']['summary'] != None and oii['object']['summary'] != "") else 0,`
			`acc.id,`
			`oii['object']['id'],`
			`post`
			`))`


initial commit 2018-10-09 03:11:51 +02:00			`for f in following:`
			last_toot = c.execute("SELECT id FROM `toots` WHERE userid LIKE ? ORDER BY id DESC LIMIT 1", (f.id,)).fetchone()
			`if last_toot != None:`
			`last_toot = last_toot[0]`
			`else:`
			`last_toot = 0`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`print("Downloading posts for user @{}, starting from {}".format(f.acct, last_toot))`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00
			`#find the user's activitypub outbox`
remove webfingering wikipedia link 2019-02-25 02:18:38 +01:00			`print("WebFingering...")`
fixed tabs i think hopefully 2019-02-07 16:45:44 +01:00			`instance = patterns["handle"].search(f.acct)`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`if instance == None:`
fixed tabs i think hopefully 2019-02-07 16:45:44 +01:00			`instance = patterns["url"].search(cfg['site']).group(1)`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`else:`
			`instance = instance.group(1)`

added instance blacklist 2019-01-11 14:08:53 +01:00			`if instance in cfg['instance_blacklist']:`
			`print("skipping blacklisted instance: {}".format(instance))`
fixed a huge bug 2018-10-25 16:33:57 +02:00			`continue`
more commenting 2019-01-11 13:15:05 +01:00
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`try:`
blacklist knzk.me (rip) 2019-07-01 03:21:08 +02:00			`# 1. download host-meta to find webfinger URL`
added a timeout 2018-10-27 14:07:38 +02:00			`r = requests.get("https://{}/.well-known/host-meta".format(instance), timeout=10)`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`# 2. use webfinger to find user's info page`
fixed tabs i think hopefully 2019-02-07 16:45:44 +01:00			`uri = patterns["uri"].search(r.text).group(1)`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`uri = uri.format(uri = "{}@{}".format(f.username, instance))`
added a timeout 2018-10-27 14:07:38 +02:00			`r = requests.get(uri, headers={"Accept": "application/json"}, timeout=10)`
fix for pleroma 2018-10-27 10:28:20 +02:00			`j = r.json()`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`found = False`
removed hacky solution, added misskey support 2019-02-07 01:53:23 +01:00			`for link in j['links']:`
			`if link['rel'] == 'self':`
			`#this is a link formatted like "https://instan.ce/users/username", which is what we need`
			`uri = link['href']`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`found = True`
			`break`
			`if not found:`
			`print("Couldn't find a valid ActivityPub outbox URL.")`

			`# 3. download first page of outbox`
bots now work properly with pleroma! 2018-11-07 06:39:12 +01:00			`uri = "{}/outbox?page=true".format(uri)`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`r = requests.get(uri, timeout=15)`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`j = r.json()`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`except:`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`print("oopsy woopsy!! we made a fucky wucky!!!\n(we're probably rate limited, please hang up and try again)")`
			`sys.exit(1)`
fix for pleroma 2018-10-27 10:28:20 +02:00
			`pleroma = False`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`if 'next' not in j:`
			`print("Using Pleroma compatibility mode")`
fix for pleroma 2018-10-27 10:28:20 +02:00			`pleroma = True`
bots now work properly with pleroma! 2018-11-07 06:39:12 +01:00			`j = j['first']`
had a proper look at the code and fixed it for realsies this time. i'm a dunce. 2018-11-09 12:49:33 +01:00			`else:`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`print("Using standard mode")`
had a proper look at the code and fixed it for realsies this time. i'm a dunce. 2018-11-09 12:49:33 +01:00			`uri = "{}&min_id={}".format(uri, last_toot)`
bots now work properly with pleroma! 2018-11-07 06:39:12 +01:00			`r = requests.get(uri)`
			`j = r.json()`

code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`print("Downloading and saving posts", end='', flush=True)`
bots now work properly with pleroma! 2018-11-07 06:39:12 +01:00			`done = False`
restored friendly error messages 2018-11-09 12:50:36 +01:00			`try:`
bots now work properly with pleroma! 2018-11-07 06:39:12 +01:00			`while not done and len(j['orderedItems']) > 0:`
			`for oi in j['orderedItems']:`
less indentified 2018-11-28 20:36:05 +01:00			`if oi['type'] != "Create":`
more commenting 2019-01-11 13:15:05 +01:00			`continue #this isn't a toot/post/status/whatever, it's a boost or a follow or some other activitypub thing. ignore`
add config option to filter for language 2019-02-25 19:30:40 +01:00
less indentified 2018-11-28 20:36:05 +01:00			`# its a toost baby`
			`content = oi['object']['content']`
			`toot = extract_toot(content)`
			`# print(toot)`
			`try:`
			`if pleroma:`
Fixes for Pleroma: Empty strings mean no CW, `oi['object']['id']` compares to `uri` field in db 2018-12-30 00:58:43 +01:00			`if c.execute("SELECT COUNT(*) FROM toots WHERE uri LIKE ?", (oi['object']['id'],)).fetchone()[0] > 0:`
less indentified 2018-11-28 20:36:05 +01:00			`#we've caught up to the notices we've already downloaded, so we can stop now`
less rude comment 2019-05-06 19:05:02 +02:00			`#you might be wondering, "lynne, what if the instance ratelimits you after 40 posts, and they've made 60 since main.py was last run? wouldn't the bot miss 20 posts and never be able to see them?" to which i reply, "i know but i don't know how to fix it"`
less indentified 2018-11-28 20:36:05 +01:00			`done = True`
fix potential keyerror 2019-07-10 02:43:56 +02:00			`if 'lang' in cfg:`
fix a keyerror 2019-05-06 19:14:30 +02:00			`try:`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`if oi['object']['contentMap'][cfg['lang']]: # filter for language`
fix a keyerror 2019-05-06 19:14:30 +02:00			`insert_toot(oi, f, toot, c)`
			`except KeyError:`
			`#JSON doesn't have contentMap, just insert the toot irregardlessly`
add config option to filter for language 2019-02-25 19:30:40 +01:00			`insert_toot(oi, f, toot, c)`
			`else:`
			`insert_toot(oi, f, toot, c)`
less indentified 2018-11-28 20:36:05 +01:00			`pass`
			`except:`
			`pass #ignore any toots that don't successfully go into the DB`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00
			`# get the next/previous page`
			`try:`
			`if not pleroma:`
			`r = requests.get(j['prev'], timeout=15)`
			`else:`
			`r = requests.get(j['next'], timeout=15)`
			`except requests.Timeout:`
			`print("HTTP timeout, site did not respond within 15 seconds")`
			`except:`
			`print("An error occurred while trying to obtain more posts.")`

bots now work properly with pleroma! 2018-11-07 06:39:12 +01:00			`j = r.json()`
			`print('.', end='', flush=True)`
Version 2.0, with vastly improved toot fetching capabilities! 2018-10-25 04:37:11 +02:00			`print(" Done!")`
			`db.commit()`
added specific error for rate limit exceeded 2019-05-06 19:02:42 +02:00			`except requests.HTTPError as e:`
			`if e.response.status_code == 429:`
			`print("Rate limit exceeded. This means we're downloading too many posts in quick succession. Saving toots to database and moving to next followed account.")`
			`db.commit()`
			`else:`
			`# TODO: remove duplicate code`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`print("Encountered an error! Saving posts to database and moving to next followed account.")`
added specific error for rate limit exceeded 2019-05-06 19:02:42 +02:00			`db.commit()`
restored friendly error messages 2018-11-09 12:50:36 +01:00			`except:`
code cleanup, fixes #23 2019-05-19 15:06:31 +02:00			`print("Encountered an error! Saving posts to database and moving to next followed account.")`
restored friendly error messages 2018-11-09 12:50:36 +01:00			`db.commit()`
only skip failing users, added windows compatibility 2018-11-01 06:27:03 +01:00
			`print("Done!")`
initial commit 2018-10-09 03:11:51 +02:00
			`db.commit()`
			`db.execute("VACUUM") #compact db`
			`db.commit()`
Fixes for Pleroma: Empty strings mean no CW, `oi['object']['id']` compares to `uri` field in db 2018-12-30 00:58:43 +01:00			`db.close()`