Snippets/ShioriFeed.py

389 lines
18 KiB
Python
Raw Normal View History

2023-02-13 13:46:26 +01:00
#!/usr/bin/env python3
2023-02-13 13:58:37 +01:00
# *----------------------------------------------------------------------* #
2023-02-15 17:54:25 +01:00
# | [ ShioriFeed 🔖 (OctoSpacc) ] | #
2023-02-13 13:58:37 +01:00
# | Simple service for getting an Atom/RSS feed from your Shiori profile | #
2023-02-15 17:54:25 +01:00
# *----------------------------------------------------------------------* #
Version = '2023-02-15'
2023-02-13 13:58:37 +01:00
# *----------------------------------------------------------------------* #
2023-02-15 17:54:25 +01:00
# *-------------------------------------------* #
# | Configuration | #
# *-------------------------------------------* #
2023-02-13 13:58:37 +01:00
Host = ('localhost', 8176)
2023-02-14 00:08:27 +01:00
Debug = False
2023-02-15 17:54:25 +01:00
UserAgent = f'ShioriFeed v{Version} at {Host[0]}'
# *-------------------------------------------* #
2023-02-13 13:58:37 +01:00
# External Requirements: urllib3
2023-02-14 00:08:27 +01:00
# TODO:
2023-02-15 17:54:25 +01:00
# - Cheking if Content mode content is actually present, otherwise fall back to Archive mode or original link (using API data is unreliable it seems)
2023-02-14 00:08:27 +01:00
# - Atom feed
# - Actually valid RSS
2023-02-15 17:54:25 +01:00
# - XML stylesheet
# - Filtering (tags, etc.)
2023-02-14 00:08:27 +01:00
# - Write privacy policy
# - Fix the URL copy thing
2023-02-15 17:54:25 +01:00
# - Minification
2023-02-14 00:08:27 +01:00
2023-02-13 13:58:37 +01:00
# *-------------------------------------------------------------------------* #
2023-02-13 13:46:26 +01:00
import traceback
import json
2023-02-15 17:54:25 +01:00
from base64 import urlsafe_b64decode as b64UrlDecode, urlsafe_b64encode as b64UrlEncode, standard_b64encode as b64Encode
2023-02-13 13:58:37 +01:00
from html import escape as HtmlEscape
2023-02-13 13:46:26 +01:00
from http.server import HTTPServer, BaseHTTPRequestHandler
from socketserver import ThreadingMixIn
from urllib.request import urlopen, Request
import threading
2023-02-13 13:58:37 +01:00
HomeTemplate = '''\
2023-02-13 13:46:26 +01:00
<!DOCTYPE html>
2023-02-13 13:58:37 +01:00
<html lang="en">
2023-02-13 13:46:26 +01:00
<head>
2023-02-13 13:58:37 +01:00
<meta charset="UTF-8"/>
2023-02-13 13:46:26 +01:00
<meta name="viewport" content="width=device-width, initial-scale=1.0"/>
2023-02-14 00:08:27 +01:00
<!--
"bookmark" Emoji icon - Copyright 2021 Google Inc. All Rights Reserved.
<https://fonts.google.com/noto/specimen/Noto+Color+Emoji/about>
<https://scripts.sil.org/cms/scripts/page.php?item_id=OFL_web>
-->
<link rel="shortcut icon" type="image/png" href="
2023-02-13 13:58:37 +01:00
<title>ShioriFeed 🔖</title>
<meta name="description" content="Simple service for getting an Atom/RSS feed from your Shiori profile"/>
<meta property="og:title" content="ShioriFeed 🔖"/>
<meta property="og:description" content="Simple service for getting an Atom/RSS feed from your Shiori profile"/>
2023-02-13 13:46:26 +01:00
<style>
2023-02-15 17:54:25 +01:00
:root {
--cFore0: #232323;
--cFore1: #292929;
--cAccent: #f44336;
--cBack0: #e9e9e9;
--cBack1: #ffffff;
/*--cGray: #c9c9c9;*/
}
@media (prefers-color-scheme: dark) {
:root {
--cFore0: #ffffff;
--cFore1: #eeeeee;
--cBack0: #292929;
--cBack1: #1f1f1f;
--cGray: #606060;
}
}
2023-02-13 13:58:37 +01:00
* { box-sizing: border-box; }
2023-02-15 17:54:25 +01:00
.Underline { text-decoration: underline; }
.NoSelect {
user-select: none;
-ms-user-select: none;
-moz-user-select: none;
-khtml-user-select: none;
-webkit-user-select: none;
-webkit-touch-callout: none;
}
2023-02-13 13:46:26 +01:00
body {
2023-02-15 17:54:25 +01:00
color: var(--cFore0);
background: var(--cBack0);
2023-02-14 00:08:27 +01:00
font-family: "Source Sans Pro", sans-serif;
2023-02-13 13:46:26 +01:00
margin: 0px;
padding-top: 24px;
padding-bottom: 24px;
padding-left: 10%;
padding-right: 10%;
2023-02-13 13:58:37 +01:00
word-break: break-word;
2023-02-13 13:46:26 +01:00
}
2023-02-15 17:54:25 +01:00
a { color: var(--cAccent); }
2023-02-13 13:58:37 +01:00
form > label { padding: 8px; }
form > label > span { padding-bottom: 4px; }
form > label, form > label > span {
2023-02-13 13:46:26 +01:00
display: inline-block;
2023-02-13 13:58:37 +01:00
width: 100%;
2023-02-13 13:46:26 +01:00
}
textarea {
width: 100%;
height: 5em;
2023-02-13 13:58:37 +01:00
font-size: large;
2023-02-13 13:46:26 +01:00
resize: none;
}
2023-02-15 17:54:25 +01:00
input { height: 2em; }
input[type="submit"] { font-size: large; }
input, textarea, details { border-radius: 2px; }
input, textarea {
width: 100%;
color: var(--cFore1);
background: var(--cBack1);
border: none;
}
2023-02-13 13:58:37 +01:00
details {
2023-02-15 17:54:25 +01:00
background: var(--cBack1)/*var(--cGray)*/;
2023-02-13 13:58:37 +01:00
padding: 8px;
}
details > summary > h4 { display: inline; }
2023-02-14 00:08:27 +01:00
span.Separator {
display: inline-block;
width: 0.25em;
height: 0.25em;
margin: 0.25em;
vertical-align: middle;
2023-02-15 17:54:25 +01:00
background: var(--cFore1);
2023-02-14 00:08:27 +01:00
}
2023-02-13 13:58:37 +01:00
/* {{PostCss}} */
2023-02-13 13:46:26 +01:00
</style>
</head>
<body>
2023-02-15 17:54:25 +01:00
<div class="NoSelect">
<h2>ShioriFeed 🔖</h2>
<p class="PostObscure">
Enter the details of your account on a
<a href="https://github.com/go-shiori/">Shiori</a>
server to get an Atom/RSS feed link.
</p>
<p class="PostObscure">
<small>Note: still a work-in-progress!</small>
</p>
<br />
<!-- {{PostResult}} -->
<p class="PostObscure">
<form action="./" method="POST">
<label class="PostObscure">
<span>Server <small>(must start with protocol prefix)</small>:</span>
<input type="text" name="Remote" placeholder="http[s]://..."/>
</label>
<br />
<label class="PostObscure">
<span>Username:</span>
<input type="text" name="Username" placeholder="erre"/>
</label>
<br />
<label class="PostObscure">
<span>Password:</span>
<input type="password" name="Password" placeholder="**********"/>
</label>
<br />
<label class="PostObscure">
<span>&nbsp;</span>
<input type="submit" value="Submit"/>
</label>
</form>
</p>
<br />
</div>
2023-02-13 13:58:37 +01:00
<!--
2023-02-15 17:54:25 +01:00
NOTE TO SELF-HOSTERS:
You should probably either adjust or remove this :)
For sure you should at least write your own domain.
-->
2023-02-13 13:46:26 +01:00
<p>
<details>
2023-02-15 17:54:25 +01:00
<summary class="NoSelect">
<!-- Change the domain if self-hosting! -->
2023-02-13 13:58:37 +01:00
<h4>Privacy Policy</h4>
2023-02-15 17:54:25 +01:00
(applies to <em class="Underline">ShioriFeed.Octt.eu.org</em>)
2023-02-13 13:46:26 +01:00
</summary>
2023-02-15 17:54:25 +01:00
<!--<ul>
<li>-->
I still have to write this... tough luck.
I'm not yet actively inviting anyone to use this instance right now,
if you're worried about your security then just host the software yourself.
<!-- </li>
</ul>-->
2023-02-13 13:46:26 +01:00
</details>
</p>
2023-02-15 17:54:25 +01:00
<p class="NoSelect">
<span>v. {{Version}}</span>
2023-02-14 00:08:27 +01:00
<span class="Separator"></span>
2023-02-13 13:46:26 +01:00
<a href="https://gitlab.com/octospacc/Snippets/-/blob/main/ShioriFeed.py">Source Code</a>
</p>
2023-02-13 13:58:37 +01:00
<script>
var Box = document.querySelector('textarea');
if (Box) {
2023-02-14 00:08:27 +01:00
//BoxFocused = false;
2023-02-13 13:58:37 +01:00
Box.value = location.origin + Box.value.substring('http[s]://<THIS SHIORIFEED SERVER ADDRESS>'.length);
2023-02-14 00:08:27 +01:00
//Box.onfocusout = function() { console.log(1); BoxFocused = false; };
//Box.onfocusin = function() { console.log(2); BoxFocused = true; };
Box.onclick = function() {
try {
//if (BoxFocused) {
navigator.clipboard.writeText(Box.value);
alert('Copied to clipboard!');
//};
} catch(e) {};
};
2023-02-13 13:58:37 +01:00
};
</script>
2023-02-13 13:46:26 +01:00
</body>
</html>
2023-02-15 17:54:25 +01:00
'''.replace('{{Version}}', Version)
def RetDebugIf():
return f'\n\n{traceback.format_exc()}' if Debug else ''
2023-02-13 13:46:26 +01:00
2023-02-13 13:58:37 +01:00
def SessionHash(Remote, Username, Password):
return f'{hash(Remote)}{hash(Username)}{hash(Password)}'
2023-02-15 17:54:25 +01:00
def MkFeed(Data, Remote, Username, Session, Type='RSS'):
2023-02-13 13:46:26 +01:00
Feed = ''
2023-02-13 13:58:37 +01:00
Date = Data['bookmarks'][0]['modified'] if Data['bookmarks'] else ''
2023-02-13 13:46:26 +01:00
for Mark in Data['bookmarks']:
2023-02-15 17:54:25 +01:00
Id = Mark['id']
Link = f'{Remote}/bookmark/{Id}/content'
# NOTE: when shiori issue #578 is fixed, this should use a thumb URL from the original article HTML to cope with private bookmarks
Cover = f'<![CDATA[<a href="{Link}"><img src="{Remote}/bookmark/{Id}/thumb"/></a>]]>' if Mark['imageURL'] else ''
# Not so sure about this chief, downloading and embedding EVERY cover image into the XML is slow (~8s per 1 req) and traffic-hungry (~10 simultaneous requests are enough to temporarily DoS the Raspi)
#ImgData = GetContent(Remote, f'bookmark/{Id}/thumb', Session) if Mark['imageURL'] else None
#Cover = f'<![CDATA[<a href="{Link}"><img src="data:{ImgData["Content-Type"]};base64,{b64Encode(ImgData["Body"]).decode()}"/></a><br /><br />]]>' if ImgData else ''
Content = f'{HtmlEscape(GetContent(Remote, f"bookmark/{Id}/content", Session)["Body"].decode())}'
if Type == 'Atom':
Feed += f'''
'''
elif Type == 'RSS':
Feed += f'''
2023-02-13 13:46:26 +01:00
<item>
2023-02-13 13:58:37 +01:00
<title>{HtmlEscape(Mark['title'])}</title>
2023-02-14 00:08:27 +01:00
<description>{Cover}{HtmlEscape(Mark['excerpt'])}</description>
2023-02-15 17:54:25 +01:00
<author>{Mark['author']}</author>
<content:encoded type="text/html">{Content}</content:encoded>
2023-02-14 00:08:27 +01:00
<link>{Link}</link>
2023-02-13 13:46:26 +01:00
<pubDate>{Mark['modified']}</pubDate>
2023-02-15 17:54:25 +01:00
<guid isPermaLink="false">{Link}</guid>
2023-02-13 13:46:26 +01:00
</item>
2023-02-15 17:54:25 +01:00
'''
if Type == 'Atom':
return f'''\
2023-02-13 13:46:26 +01:00
'''
2023-02-15 17:54:25 +01:00
elif Type == 'RSS':
return f'''\
<?xml version="1.0" encoding="utf-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:media="http://search.yahoo.com/mrss/">
2023-02-13 13:46:26 +01:00
<channel>
2023-02-13 13:58:37 +01:00
<title>ShioriFeed ({HtmlEscape(Username)}) 🔖</title>
2023-02-13 13:46:26 +01:00
<pubDate>{Date}</pubDate>
<lastBuildDate>{Date}</lastBuildDate>
{Feed}
</channel>
</rss>
2023-02-15 17:54:25 +01:00
'''
2023-02-13 13:46:26 +01:00
2023-02-15 17:54:25 +01:00
def MkUrl(Post, Type='RSS'):
2023-02-13 13:58:37 +01:00
Args = {}
#Args = Post.split('&')
for Arg in Post.split('&'):
Arg = Arg.split('=')
Args.update({Arg[0]: Arg[1]})
return f'''\
http[s]://<THIS SHIORIFEED SERVER ADDRESS>\
/{Args['Remote']}\
2023-02-15 17:54:25 +01:00
/{b64UrlEncode(Args['Username'].encode()).decode()}\
/{b64UrlEncode(Args['Password'].encode()).decode()}\
2023-02-14 00:08:27 +01:00
/{Type}.xml'''
2023-02-13 13:58:37 +01:00
2023-02-13 13:46:26 +01:00
def GetSession(Remote, Username, Password):
try:
Rq = urlopen(Request(f'{Remote}/api/login',
data=json.dumps({'username': Username, 'password': Password, 'remember': True, 'owner': True}).encode(),
2023-02-15 17:54:25 +01:00
headers={'User-Agent': UserAgent}))
2023-02-13 13:46:26 +01:00
if Rq.code == 200:
2023-02-13 13:58:37 +01:00
Data = {SessionHash(Remote, Username, Password): json.loads(Rq.read().decode())['session']}
2023-02-13 13:46:26 +01:00
Sessions.update(Data)
2023-02-15 17:54:25 +01:00
return {'Code': 200, 'Body': Data}
else:
return {'Code': Rq.code, 'Body': f'[{Rq.code}] External Server Error\n\n{Rq.read().decode()}'}
except Exception:
return {'Code': 500, 'Body': f'[500] Internal Server Error{RetDebugIf()}'}
def GetContent(Remote, Path, Session):
try:
Rq = urlopen(Request(f'{Remote}/{Path}', headers={'X-Session-Id': Session, 'User-Agent': UserAgent}))
if Rq.code == 200:
return {'Code': 200, 'Body': Rq.read(), 'Content-Type': Rq.headers['Content-Type']}
2023-02-13 13:58:37 +01:00
else:
2023-02-15 17:54:25 +01:00
return {'Code': Rq.code, 'Body': f'[{Rq.code}] External Server Error\n\n{Rq.read().decode()}'.encode()}
except Exception:
return {'Code': 500, 'Body': f'[500] Internal Server Error{RetDebugIf()}'.encode()}
2023-02-13 13:46:26 +01:00
def RqHandle(Path, Attempt=0):
try:
2023-02-13 13:58:37 +01:00
Rs = {}
Args = Path.strip().removeprefix('/').removesuffix('/').strip().split('/')
if Args[0] == '':
2023-02-15 17:54:25 +01:00
return {'Code': 200, 'Body': HomeTemplate, 'Content-Type': 'text/html'}
2023-02-13 13:46:26 +01:00
else:
2023-02-14 00:08:27 +01:00
Shift = 1 if Args[-1].lower().startswith(('atom.xml', 'rss.xml')) else 0
Remote = '/'.join(Args[:-(2+Shift)])
2023-02-15 17:54:25 +01:00
Username = b64UrlDecode(Args[-(2+Shift)]).decode()
Password = b64UrlDecode(Args[-(1+Shift)]).decode()
2023-02-13 13:58:37 +01:00
if not SessionHash(Remote, Username, Password) in Sessions:
TrySession = GetSession(Remote, Username, Password)
if TrySession['Code'] != 200:
return TrySession
2023-02-15 17:54:25 +01:00
Session = Sessions[SessionHash(Remote, Username, Password)]
2023-02-13 13:46:26 +01:00
Rq = urlopen(Request(f'{Remote}/api/bookmarks', headers={
2023-02-15 17:54:25 +01:00
'X-Session-Id': Session,
'User-Agent': UserAgent}))
2023-02-13 13:46:26 +01:00
Rs['Code'] = Rq.code
if Rq.code == 200:
2023-02-15 17:54:25 +01:00
# Shiori got us JSON data, parse it and return our result
Rs['Body'] = MkFeed(json.loads(Rq.read().decode()), Remote, Username, Session)
2023-02-13 13:46:26 +01:00
Rs['Content-Type'] = 'application/xml'
elif Rq.code == 500 and Attempt < 1:
2023-02-15 17:54:25 +01:00
# We probably got an expired Session-Id, let's renew it and retry
2023-02-13 13:58:37 +01:00
TrySession = GetSession(Remote, Username, Password)
if TrySession['Code'] != 200:
return TrySession
2023-02-13 13:46:26 +01:00
return ReqHandle(Path, Attempt+1)
else:
Rs['Body'] = f'[{Rq.code}] External Server Error\n\n{Rq.read().decode()}'
2023-02-13 13:58:37 +01:00
return Rs
2023-02-15 17:54:25 +01:00
except Exception:
return {'Code': 500, 'Body': f'[500] Internal Server Error{RetDebugIf()}'}
2023-02-13 13:46:26 +01:00
class Handler(BaseHTTPRequestHandler):
def do_GET(self):
Rs = RqHandle(self.path)
self.send_response(Rs['Code'])
2023-02-13 13:58:37 +01:00
self.send_header('Content-Type', Rs['Content-Type'] if 'Content-Type' in Rs else 'text/plain')
2023-02-13 13:46:26 +01:00
self.end_headers()
self.wfile.write(Rs['Body'].encode())
def do_POST(self):
2023-02-13 13:58:37 +01:00
try:
if self.path == '/':
Body = HomeTemplate.replace('<!-- {{PostResult}} -->', f'''
2023-02-13 13:46:26 +01:00
<p>
2023-02-14 00:08:27 +01:00
Here's your RSS feed:
2023-02-13 13:58:37 +01:00
<textarea readonly="true">{MkUrl(self.rfile.read(int(self.headers['Content-Length'])).decode())}</textarea>
2023-02-13 13:46:26 +01:00
</p>
<br />
2023-02-13 13:58:37 +01:00
''').replace('/* {{PostCss}} */', '.PostObscure { opacity: 0.5; }')
self.send_response(200)
self.send_header('Content-Type', 'text/html')
self.end_headers()
self.wfile.write(Body.encode())
else:
self.send_response(400)
self.send_header('Content-Type', 'text/plain')
self.end_headers()
self.wfile.write(b'[400] Bad Request')
except Exception:
self.send_response(500)
2023-02-13 13:46:26 +01:00
self.send_header('Content-Type', 'text/plain')
self.end_headers()
2023-02-15 17:54:25 +01:00
self.wfile.write((f'[500] Internal Server Error{RetDebugIf()}').encode())
2023-02-13 13:58:37 +01:00
# https://stackoverflow.com/a/3389505
def log_message(self, format, *args):
2023-02-13 13:46:26 +01:00
return
2023-02-13 13:58:37 +01:00
# https://stackoverflow.com/a/51559006
2023-02-13 13:46:26 +01:00
class ThreadedHTTPServer(ThreadingMixIn, HTTPServer):
pass
def Serve():
ThreadedHTTPServer(Host, Handler).serve_forever()
if __name__ == '__main__':
Sessions = {}
try:
Serve()
except KeyboardInterrupt:
pass