···
10
+
class DatabaseWorker(threading.Thread):
11
+
def __init__(self, name, db_path, task_queue):
13
+
self.db_cnx = apsw.Connection(db_path)
14
+
self.db_cnx.pragma('foreign_keys', True)
15
+
self.db_cnx.pragma('journal_mode', 'WAL')
16
+
self.db_cnx.pragma('wal_autocheckpoint', '0')
17
+
self.stop_signal = False
18
+
self.task_queue = task_queue
19
+
self.logger = logging.getLogger(f'feeds.db.{name}')
23
+
while not self.stop_signal:
24
+
task = self.task_queue.get(block=True)
26
+
self.stop_signal = True
27
+
elif task == 'COMMIT':
28
+
self.logger.debug(f'committing {self.changes} changes')
29
+
if self.db_cnx.in_transaction:
30
+
self.db_cnx.execute('COMMIT')
31
+
checkpoint = self.db_cnx.execute('PRAGMA wal_checkpoint(PASSIVE)')
32
+
self.logger.debug(f'checkpoint: {checkpoint.fetchall()!r}')
34
+
self.logger.debug(f'qsize: {self.task_queue.qsize()}')
36
+
sql, bindings = task
37
+
if not self.db_cnx.in_transaction:
38
+
self.db_cnx.execute('BEGIN')
39
+
self.db_cnx.execute(sql, bindings)
40
+
self.changes += self.db_cnx.changes()
41
+
self.task_queue.task_done()
45
+
self.task_queue.put('STOP')
class MostLikedFeed(BaseFeed):
FEED_URI = 'at://did:plc:4nsduwlpivpuur4mqkbfvm6a/app.bsky.feed.generator/most-liked'
10
-
SERVE_FEED_QUERY = """
11
-
select uri, create_ts, unixepoch('now', '-24 hours'), create_ts - unixepoch('now', '-24 hours'), likes
13
-
where create_ts >= unixepoch('now', '-24 hours')
14
-
order by likes desc, create_ts asc
15
-
limit :limit offset :offset
DELETE_OLD_POSTS_QUERY = """
19
-
where create_ts < unixepoch('now', '-24 hours')
50
+
delete from posts where (
51
+
create_ts < unixepoch('now', '-15 minutes') and likes < 2
52
+
) or create_ts < unixepoch('now', '-24 hours');
self.db_cnx = apsw.Connection('db/mostliked.db')
57
+
self.db_cnx.pragma('foreign_keys', True)
self.db_cnx.pragma('journal_mode', 'WAL')
self.db_cnx.pragma('wal_autocheckpoint', '0')
create table if not exists posts (
30
-
uri text, create_ts timestamp, likes int
64
+
uri text primary key,
65
+
create_ts timestamp,
68
+
create table if not exists langs (
71
+
foreign key(uri) references posts(uri) on delete cascade
32
-
create unique index if not exists uri_idx on posts(uri);
33
-
create index if not exists create_ts_idx on posts(create_ts);
73
+
create index if not exists ts_idx on posts(create_ts);
self.logger = logging.getLogger('feeds.mostliked')
78
+
self.db_writes = queue.Queue()
79
+
db_worker = DatabaseWorker('mostliked', 'db/mostliked.db', self.db_writes)
def process_commit(self, commit):
83
+
if commit['opType'] != 'c':
41
-
def delete_old_posts(self):
42
-
self.db_cnx.execute(self.DELETE_OLD_POSTS_QUERY)
43
-
self.logger.debug('deleted {} old posts'.format(self.db_cnx.changes()))
86
+
if commit['collection'] == 'app.bsky.feed.post':
87
+
record = commit.get('record')
88
+
post_uri = f"at://{commit['did']}/app.bsky.feed.post/{commit['rkey']}"
90
+
'insert or ignore into posts (uri, create_ts, likes) values (:uri, :ts, 0)',
91
+
{'uri': post_uri, 'ts': self.safe_timestamp(record.get('createdAt')).timestamp()}
93
+
self.db_writes.put(task)
95
+
langs = record.get('langs', [])
98
+
'insert or ignore into langs (uri, lang) values (:uri, :lang)',
99
+
{'uri': post_uri, 'lang': lang}
101
+
self.db_writes.put(task)
103
+
elif commit['collection'] == 'app.bsky.feed.like':
104
+
record = commit.get('record')
106
+
subject_uri = record['subject']['uri']
111
+
'update posts set likes = likes + 1 where uri = :uri',
112
+
{'uri': subject_uri}
114
+
self.db_writes.put(task)
def commit_changes(self):
46
-
self.delete_old_posts()
47
-
self.logger.debug('committing changes')
48
-
self.transaction_commit(self.db_cnx)
49
-
self.wal_checkpoint(self.db_cnx, 'RESTART')
117
+
self.db_writes.put((self.DELETE_OLD_POSTS_QUERY, {}))
118
+
self.db_writes.put('COMMIT')
120
+
def generate_sql(self, limit, offset, langs):
123
+
select posts.uri, create_ts, create_ts - unixepoch('now', '-15 minutes') as rem, likes, lang
125
+
left join langs on posts.uri = langs.uri
128
+
if not '*' in langs:
129
+
lang_values = list(langs.values())
130
+
bindings.extend(lang_values)
131
+
sql += " OR ".join(['lang = ?'] * len(lang_values))
135
+
order by likes desc, create_ts desc
138
+
bindings.extend([limit, offset])
139
+
return sql, bindings
def serve_feed(self, limit, offset, langs):
53
-
'at://did:plc:4nsduwlpivpuur4mqkbfvm6a/app.bsky.feed.post/3l3cgg5vbc72i'
142
+
sql, bindings = self.generate_sql(limit, offset, langs)
143
+
cur = self.db_cnx.execute(sql, bindings)
144
+
return [row[0] for row in cur]
def serve_feed_debug(self, limit, offset, langs):
147
+
sql, bindings = self.generate_sql(limit, offset, langs)
148
+
return apsw.ext.format_query_table(
149
+
self.db_cnx, sql, bindings,
150
+
string_sanitize=2, text_width=9999, use_unicode=True