1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
|
#!/usr/bin/env python
# RSS feed mirror on Misskey
# Copyright (C) 2021 Nguyễn Gia Phong
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published
# by the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <https://www.gnu.org/licenses/>.
from configparser import ConfigParser
from contextlib import AsyncExitStack
from functools import partial
from re import split, sub
from feedparser import parse
from httpx import AsyncClient, Limits
from loca import Loca
from markdownify import markdownify as md
from trio import open_nursery, run
async def create(client, **note):
"""Create the given note and return its ID."""
response = await client.post('notes/create', json=note)
return response.json()['createdNote']['id']
async def post(job, client, link, title, summary):
"""Post the given entry to Misskey.
In case the link was already posted, the entry shall be skipped.
"""
search = await client.post('notes/search', json={'query': link,
'userId': job['user']})
if search.json(): return
note = partial(create, client, i=job['token'], visibility='home', cw=title)
original = f'Original: {link}'
rest = '\n\n'.join((*map(partial(sub, r'\s+', ' '),
split(r'\s*\n{2,}\s*', md(summary).strip())),
original))
limit = int(job['limit'])
parent = None
while len(rest) > limit:
index = rest.rfind('\n\n', 0, limit+2) # split paragraphs
if index < 0:
index = rest.rfind('. ', 0, limit+1) # split sentences
if index < 0:
parent = await note(text=original, replyId=parent)
return
first, rest = rest[:index+1], rest[index+2:]
else:
first, rest = rest[:index], rest[index+2:]
parent = await note(text=first, replyId=parent)
parent = await note(text=rest, replyId=parent)
async def mirror(nursery, job, client):
"""Perform the given mirror job."""
feed = await client.get(job['source'])
for entry in parse(feed.text)['entries']:
nursery.start_soon(post, job, client, entry['link'],
entry['title'], entry['summary'])
async def main():
"""Parse and run jobs."""
config = ConfigParser()
config.read(Loca().user.config()/'rsskey'/'jobs.conf')
async with AsyncExitStack() as stack, open_nursery() as nursery:
for section in config:
if section == 'DEFAULT': continue
job = config[section]
client = AsyncClient(base_url=job['dest'],
limits=Limits(max_connections=16))
await stack.enter_async_context(client)
nursery.start_soon(mirror, nursery, job, client)
if __name__ == '__main__': run(main)
|