kopia lustrzana https://github.com/snarfed/bridgy-fed
107 wiersze
3.8 KiB
Python
107 wiersze
3.8 KiB
Python
"""Simple conneg endpoint that serves AS2 or redirects to the original post.
|
|
|
|
Serves /r/https://foo.com/bar URL paths, where https://foo.com/bar is an
|
|
original post. Needed for Mastodon interop, they require that AS2 object ids and
|
|
urls are on the same domain that serves them. Background:
|
|
|
|
https://github.com/snarfed/bridgy-fed/issues/16#issuecomment-424799599
|
|
https://github.com/tootsuite/mastodon/pull/6219#issuecomment-429142747
|
|
|
|
The conneg makes these /r/ URLs searchable in Mastodon:
|
|
https://github.com/snarfed/bridgy-fed/issues/352
|
|
"""
|
|
import logging
|
|
import re
|
|
import urllib.parse
|
|
|
|
from flask import g, redirect, request
|
|
from granary import as2
|
|
from negotiator import ContentNegotiator, AcceptParameters, ContentType
|
|
from oauth_dropins.webutil import flask_util, util
|
|
from oauth_dropins.webutil.flask_util import error
|
|
from oauth_dropins.webutil.util import json_dumps, json_loads
|
|
|
|
from activitypub import ActivityPub
|
|
from flask_app import app, cache
|
|
from common import CACHE_TIME, CONTENT_TYPE_HTML
|
|
from models import Object, User
|
|
from web import Web
|
|
|
|
logger = logging.getLogger(__name__)

# Content types this endpoint negotiates between, in the order they are
# handed to the negotiator: plain HTML first, then the two AS2 flavors.
_ACCEPTABLE_TYPES = (
    CONTENT_TYPE_HTML,
    as2.CONTENT_TYPE,
    as2.CONTENT_TYPE_LD,
)

# Shared negotiator used to match a request's Accept header against the
# content types above.
_negotiator = ContentNegotiator(acceptable=[
    AcceptParameters(ContentType(content_type))
    for content_type in _ACCEPTABLE_TYPES
])
|
|
|
|
|
|
@app.get(r'/r/<path:to>')
@flask_util.cached(cache, CACHE_TIME, headers=['Accept'])
def redir(to):
    """Either redirect to a given URL or convert it to another format.

    E.g. redirects /r/https://foo.com/bar?baz to https://foo.com/bar?baz, or if
    it's requested with AS2 conneg in the Accept header, fetches and converts
    and serves it as AS2.

    Args:
      to: str, the target URL, taken from everything after ``/r/`` in the
        request path. The request's query parameters, if any, are appended
        to it.

    Returns:
      One of:

      * a ``(body, headers)`` tuple with the AS2 representation of the target
        when the Accept header negotiates to an AS2 content type
      * a ``(message, 404)`` tuple when no :class:`Web` user exists for the
        target's domain (non-AS2 requests only), or when the object can't be
        loaded or is deleted (AS2 requests)
      * otherwise, a 301 redirect response to the target URL

      If the target is not a web URL, :func:`error` is called instead;
      presumably that aborts the request with an HTTP error.
    """
    if request.args:
        # NOTE(review): request.args is a multi-valued mapping; urlencode() on
        # it may drop repeated query parameters and re-encodes values. Confirm
        # whether the raw query string should be forwarded instead.
        to += '?' + urllib.parse.urlencode(request.args)
    # some browsers collapse repeated /s in the path down to a single slash.
    # if that happened to this URL, expand it back to two /s.
    to = re.sub(r'^(https?:/)([^/])', r'\1/\2', to)

    if not util.is_web(to):
        error(f'Expected fully qualified URL; got {to}')

    to_domain = urllib.parse.urlparse(to).hostname

    # check conneg
    accept_as2 = False
    # only read below when accept_as2 is True, in which case it has been set
    # to the negotiated AS2 content type
    accept_type = None
    accept = request.headers.get('Accept')
    if accept:
        try:
            negotiated = _negotiator.negotiate(accept)
        except ValueError:
            # work around https://github.com/CottageLabs/negotiator/issues/6
            negotiated = None
        if negotiated:
            accept_type = str(negotiated.content_type)
            if accept_type in (as2.CONTENT_TYPE, as2.CONTENT_TYPE_LD):
                accept_as2 = True

    # check that we've seen this domain before so we're not an open redirect
    domains = {
        util.domain_from_link(to, minimize=True),
        util.domain_from_link(to, minimize=False),
        to_domain,
    }
    for domain in domains:
        if domain:
            # TODO(#512): do we need to parameterize this by protocol? or is it
            # only for web?
            g.user = Web.get_by_id(domain)
            if g.user:
                logger.info(f'Found web user for domain {domain}')
                break
    else:
        # loop finished without a break, ie no candidate domain has a Web user
        if accept_as2:
            # AS2 requests are still served; record the target's site root as
            # the external user
            g.external_user = urllib.parse.urljoin(to, '/')
            logger.info(f'No web user for {g.external_user}')
        else:
            return f'No web user found for any of {domains}', 404

    if accept_as2:
        # AS2 requested, fetch and convert and serve
        obj = Web.load(to, check_backlink=False)
        if not obj or obj.deleted:
            return f'Object not found: {to}', 404
        # second element of serve()'s return value is unused here; the
        # response headers are built explicitly below
        ret, _ = ActivityPub.serve(obj)
        logger.info(f'Returning: {json_dumps(ret, indent=2)}')
        return ret, {
            'Content-Type': accept_type,
            'Access-Control-Allow-Origin': '*',
        }

    # redirect
    logger.info(f'redirecting to {to}')
    return redirect(to, code=301)
|