telematrix/app_service.py

510 lines
18 KiB
Python
Raw Normal View History

2016-09-26 03:52:59 +02:00
"""
Telematrix
App service for Matrix to bridge a room with a Telegram group.
"""
2016-09-13 16:17:11 +02:00
import asyncio
2016-09-26 03:52:59 +02:00
import html
import json
2016-09-13 16:17:11 +02:00
import logging
import mimetypes
2016-09-26 03:52:59 +02:00
from datetime import datetime
from time import time
2016-09-13 16:17:11 +02:00
from urllib.parse import unquote, quote, urlparse, parse_qs
2016-09-26 03:52:59 +02:00
from aiohttp import web, ClientSession
from aiotg import Bot
2016-09-13 16:17:11 +02:00
from bs4 import BeautifulSoup
import database as db
2016-09-26 03:52:59 +02:00
# Read the configuration file
2016-09-13 16:17:11 +02:00
try:
2016-09-26 03:52:59 +02:00
with open('config.json', 'r') as config_file:
CONFIG = json.load(config_file)
2016-09-13 16:17:11 +02:00
2016-09-26 03:52:59 +02:00
HS_TOKEN = CONFIG['tokens']['hs']
AS_TOKEN = CONFIG['tokens']['as']
TG_TOKEN = CONFIG['tokens']['telegram']
try:
GOOGLE_TOKEN = CONFIG['tokens']['google']
except KeyError:
GOOGLE_TOKEN = None
2016-09-13 16:17:11 +02:00
2016-09-26 03:52:59 +02:00
MATRIX_HOST = CONFIG['hosts']['internal']
MATRIX_HOST_EXT = CONFIG['hosts']['external']
MATRIX_HOST_BARE = CONFIG['hosts']['bare']
2016-09-13 16:17:11 +02:00
MATRIX_PREFIX = MATRIX_HOST + '_matrix/client/r0/'
MATRIX_MEDIA_PREFIX = MATRIX_HOST + '_matrix/media/r0/'
2016-09-26 03:52:59 +02:00
USER_ID_FORMAT = CONFIG['user_id_format']
2016-09-13 16:17:11 +02:00
2016-09-26 03:52:59 +02:00
TELEGRAM_CHATS = CONFIG['chats']
MATRIX_ROOMS = {v: k for k, v in TELEGRAM_CHATS.items()}
DATABASE_URL = CONFIG['db_url']
2016-09-26 03:52:59 +02:00
except (OSError, IOError) as exception:
2016-09-13 16:17:11 +02:00
print('Error opening config file:')
2016-09-26 03:52:59 +02:00
print(exception)
2016-09-13 16:17:11 +02:00
exit(1)
2016-09-26 03:52:59 +02:00
GOO_GL_URL = 'https://www.googleapis.com/urlshortener/v1/url'
TG_BOT = Bot(api_token=TG_TOKEN)
MATRIX_SESS = ClientSession()
SHORTEN_SESS = ClientSession()
2016-09-13 16:17:11 +02:00
def create_response(code, obj):
2016-09-26 03:52:59 +02:00
"""
Create an HTTP response with a JSON body.
:param code: The status code of the response.
:param obj: The object to serialize and include in the response.
:return: A web.Response.
"""
return web.Response(text=json.dumps(obj), status=code,
content_type='application/json', charset='utf-8')
2016-09-13 16:17:11 +02:00
VALID_TAGS = ['b', 'strong', 'i', 'em', 'a', 'pre']
2016-09-26 03:52:59 +02:00
def sanitize_html(string):
"""
Sanitize an HTML string for the Telegram bot API.
:param string: The HTML string to sanitized.
:return: The sanitized HTML string.
"""
string = string.replace('<br>', '\n').replace('<br/>', '\n') \
.replace('<br />', '\n')
soup = BeautifulSoup(string, 'html.parser')
2016-09-13 16:17:11 +02:00
for tag in soup.find_all(True):
if tag.name == 'blockquote':
tag.string = ('\n' + tag.text).replace('\n', '\n> ').rstrip('\n>')
if tag.name not in VALID_TAGS:
tag.hidden = True
return soup.renderContents().decode('utf-8')
2016-09-26 03:52:59 +02:00
def format_matrix_msg(form, username, content):
"""
Formats a matrix message for sending to Telegram
:param form: The format string of the message, where the first parameter
is the username and the second one the message.
:param username: The username of the user.
:param content: The content to be sent.
:return: The formatted string.
"""
if 'format' in content and content['format'] == 'org.matrix.custom.html':
sanitized = sanitize_html(content['formatted_body'])
return html.escape(form).format(username, sanitized), 'HTML'
else:
return form.format(username, content['body']), None
async def download_matrix_file(url, filename):
"""
Download a file from an MXC URL to /tmp/{filename}
:param url: The MXC URL to download from.
:param filename: The filename in /tmp/ to download into.
"""
m_url = MATRIX_MEDIA_PREFIX + 'download/{}{}'.format(url.netloc, url.path)
async with MATRIX_SESS.get(m_url) as response:
data = await response.read()
with open('/tmp/{}'.format(filename), 'wb') as file:
file.write(data)
async def shorten_url(url):
"""
Shorten an URL using goo.gl. Returns the original URL if it fails.
:param url: The URL to shorten.
:return: The shortened URL.
"""
if not GOOGLE_TOKEN:
return url
2016-09-26 03:52:59 +02:00
headers = {'Content-Type': 'application/json'}
async with SHORTEN_SESS.post(GOO_GL_URL, params={'key': GOOGLE_TOKEN},
2016-11-14 11:07:26 +01:00
data=json.dumps({'longUrl': url}),
2016-09-26 04:11:18 +02:00
headers=headers) \
2016-09-26 03:52:59 +02:00
as response:
2016-09-26 04:11:18 +02:00
obj = await response.json()
2016-09-26 03:52:59 +02:00
2016-09-26 04:11:18 +02:00
if 'id' in obj:
return obj['id']
else:
return url
2016-09-26 03:52:59 +02:00
def matrix_is_telegram(user_id):
username = user_id.split(':')[0][1:]
return username.startswith('telegram_')
def get_username(user_id):
return user_id.split(':')[0][1:]
2016-09-26 03:52:59 +02:00
2016-09-13 16:17:11 +02:00
async def matrix_transaction(request):
2016-09-26 03:52:59 +02:00
"""
Handle a transaction sent by the homeserver.
:param request: The request containing the transaction.
:return: The response to send.
"""
2016-09-13 16:17:11 +02:00
body = await request.json()
events = body['events']
for event in events:
print(event)
if event['type'] == 'm.room.aliases':
aliases = event['content']['aliases']
links = db.session.query(db.ChatLink)\
.filter_by(matrix_room=event['room_id']).all()
for link in links:
db.session.delete(link)
for alias in aliases:
print(alias)
if alias.split('_')[0] != '#telegram' \
or alias.split(':')[-1] != MATRIX_HOST_BARE:
continue
tg_id = alias.split('_')[1].split(':')[0]
link = db.ChatLink(event['room_id'], tg_id, True)
db.session.add(link)
db.session.commit()
continue
link = db.session.query(db.ChatLink)\
.filter_by(matrix_room=event['room_id']).first()
if not link:
print('{} isn\'t linked!'.format(event['room_id']))
continue
group = TG_BOT.group(link.tg_room)
if event['type'] == 'm.room.message':
user_id = event['user_id']
if matrix_is_telegram(user_id):
continue
sender = db.session.query(db.MatrixUser)\
.filter_by(matrix_id=user_id).first()
if not sender:
response = await matrix_get('client', 'profile/{}/displayname'
.format(user_id), None)
try:
displayname = response['displayname']
except KeyError:
displayname = get_username(user_id)
sender = db.MatrixUser(user_id, displayname)
db.session.add(sender)
else:
displayname = sender.name or get_username(user_id)
2016-09-13 16:17:11 +02:00
content = event['content']
2016-09-13 16:17:11 +02:00
if content['msgtype'] == 'm.text':
msg, mode = format_matrix_msg('<{}> {}', displayname, content)
2016-09-26 03:52:59 +02:00
await group.send_text(msg, parse_mode=mode)
2016-09-13 16:17:11 +02:00
elif content['msgtype'] == 'm.notice':
msg, mode = format_matrix_msg('[{}] {}', displayname, content)
2016-09-26 03:52:59 +02:00
await group.send_text(msg, parse_mode=mode)
2016-09-13 16:17:11 +02:00
elif content['msgtype'] == 'm.emote':
msg, mode = format_matrix_msg('* {} {}', displayname, content)
2016-09-26 03:52:59 +02:00
await group.send_text(msg, parse_mode=mode)
2016-09-13 16:17:11 +02:00
elif content['msgtype'] == 'm.image':
url = urlparse(content['url'])
2016-09-26 11:30:39 +02:00
await download_matrix_file(url, content['body'])
2016-09-26 03:52:59 +02:00
with open('/tmp/{}'.format(content['body']), 'rb') as img_file:
url_str = MATRIX_HOST_EXT + \
'_matrix/media/r0/download/{}{}' \
.format(url.netloc, quote(url.path))
url_str = await shorten_url(url_str)
2016-09-26 03:52:59 +02:00
caption = '<{}> {} ({})'.format(displayname,
content['body'], url_str)
2016-09-26 03:52:59 +02:00
await group.send_photo(img_file, caption=caption)
2016-09-13 16:17:11 +02:00
else:
2016-09-26 11:59:38 +02:00
print('Unsupported message type {}'.format(content['msgtype']))
2016-09-13 16:17:11 +02:00
print(json.dumps(content, indent=4))
elif event['type'] == 'm.room.member':
if matrix_is_telegram(event['state_key']):
continue
user_id = event['state_key']
content = event['content']
2016-09-13 16:17:11 +02:00
sender = db.session.query(db.MatrixUser)\
.filter_by(matrix_id=user_id).first()
if sender:
displayname = sender.name
else:
displayname = get_username(user_id)
if content['membership'] == 'join':
displayname = content['displayname'] or get_username(user_id)
if not sender:
sender = db.MatrixUser(user_id, displayname)
else:
sender.name = displayname
db.session.add(sender)
msg = '> {} has joined the room'.format(displayname)
await group.send_text(msg)
elif content['membership'] == 'leave':
msg = '< {} has left the room'.format(displayname)
await group.send_text(msg)
elif content['membership'] == 'ban':
msg = '<! {} was banned from the room'.format(displayname)
await group.send_text(msg)
db.session.commit()
2016-09-13 16:17:11 +02:00
return create_response(200, {})
2016-09-26 03:52:59 +02:00
async def _matrix_request(method_fun, category, path, user_id, data=None,
content_type=None):
# pylint: disable=too-many-arguments
# Due to this being a helper function, the argument count acceptable
if content_type is None:
content_type = 'application/octet-stream'
2016-09-13 16:17:11 +02:00
if data is not None:
if isinstance(data, dict):
2016-09-26 04:00:23 +02:00
data = json.dumps(data)
2016-09-13 16:17:11 +02:00
content_type = 'application/json; charset=utf-8'
params = {'access_token': AS_TOKEN}
if user_id is not None:
params['user_id'] = user_id
2016-09-26 03:52:59 +02:00
async with method_fun('{}_matrix/{}/r0/{}'
.format(MATRIX_HOST, quote(category), quote(path)),
2016-09-26 04:00:23 +02:00
params=params, data=data,
2016-09-26 03:52:59 +02:00
headers={'Content-Type': content_type}) as response:
if response.headers['Content-Type'].split(';')[0] \
== 'application/json':
2016-09-13 16:17:11 +02:00
return await response.json()
else:
return await response.read()
2016-09-26 03:52:59 +02:00
2016-09-13 16:17:11 +02:00
def matrix_post(category, path, user_id, data, content_type=None):
2016-09-26 03:52:59 +02:00
return _matrix_request(MATRIX_SESS.post, category, path, user_id, data,
content_type)
2016-09-13 16:17:11 +02:00
def matrix_put(category, path, user_id, data, content_type=None):
2016-09-26 03:52:59 +02:00
return _matrix_request(MATRIX_SESS.put, category, path, user_id, data,
content_type)
2016-09-13 16:17:11 +02:00
def matrix_get(category, path, user_id):
2016-09-26 03:52:59 +02:00
return _matrix_request(MATRIX_SESS.get, category, path, user_id)
2016-09-13 16:17:11 +02:00
def matrix_delete(category, path, user_id):
2016-09-26 03:52:59 +02:00
return _matrix_request(MATRIX_SESS.delete, category, path, user_id)
2016-09-13 16:17:11 +02:00
async def matrix_room(request):
room_alias = request.match_info['room_alias']
args = parse_qs(urlparse(request.path_qs).query)
2016-09-26 03:52:59 +02:00
print('Checking for {} | {}'.format(unquote(room_alias),
args['access_token'][0]))
2016-09-13 16:17:11 +02:00
try:
if args['access_token'][0] != HS_TOKEN:
return create_response(403, {'errcode': 'M_FORBIDDEN'})
except KeyError:
2016-09-26 03:52:59 +02:00
return create_response(401,
{'errcode':
'NL.SIJMENSCHOON.TELEMATRIX_UNAUTHORIZED'})
2016-09-13 16:17:11 +02:00
2016-09-26 03:52:59 +02:00
localpart = room_alias.split(':')[0]
2016-09-13 16:17:11 +02:00
chat = '_'.join(localpart.split('_')[1:])
# Look up the chat in the database
2016-09-26 03:52:59 +02:00
if chat in TELEGRAM_CHATS:
await matrix_post('client', 'createRoom', None,
{'room_alias_name': localpart[1:]})
2016-09-13 16:17:11 +02:00
return create_response(200, {})
else:
2016-09-26 03:52:59 +02:00
return create_response(404, {'errcode':
'NL.SIJMENSCHOON.TELEMATRIX_NOT_FOUND'})
2016-09-13 16:17:11 +02:00
def send_matrix_message(room_id, user_id, txn_id, **kwargs):
2016-09-26 03:52:59 +02:00
return matrix_put('client', 'rooms/{}/send/m.room.message/{}'
.format(room_id, txn_id), user_id, kwargs)
2016-09-13 16:17:11 +02:00
async def upload_tgfile_to_matrix(file_id, user_id):
2016-09-26 03:52:59 +02:00
file_path = (await TG_BOT.get_file(file_id))['file_path']
request = await TG_BOT.download_file(file_path)
2016-09-13 16:17:11 +02:00
mimetype = request.headers['Content-Type']
data = await request.read()
j = await matrix_post('media', 'upload', user_id, data, mimetype)
if 'content_uri' in j:
2016-09-26 03:52:59 +02:00
return j['content_uri'], mimetype, len(data)
2016-09-13 16:17:11 +02:00
else:
return None, None, 0
2016-09-26 03:52:59 +02:00
2016-09-13 16:17:11 +02:00
async def register_join_matrix(chat, room_id, user_id):
name = chat.sender['first_name']
if 'last_name' in chat.sender:
name += ' ' + chat.sender['last_name']
name += ' (Telegram)'
user = user_id.split(':')[0][1:]
2016-09-26 03:52:59 +02:00
await matrix_post('client', 'register', None,
{'type': 'm.login.application_service', 'user': user})
profile_photos = await TG_BOT.get_user_profile_photos(chat.sender['id'])
2016-09-13 16:17:11 +02:00
try:
pp_file_id = profile_photos['result']['photos'][0][-1]['file_id']
pp_uri, _, _ = await upload_tgfile_to_matrix(pp_file_id, user_id)
if pp_uri:
2016-09-26 03:52:59 +02:00
await matrix_put('client', 'profile/{}/avatar_url'.format(user_id),
user_id, {'avatar_url': pp_uri})
2016-09-13 16:17:11 +02:00
except IndexError:
pass
2016-09-26 03:52:59 +02:00
await matrix_put('client', 'profile/{}/displayname'.format(user_id),
user_id, {'displayname': name})
2016-09-13 16:17:11 +02:00
await matrix_post('client', 'join/{}'.format(room_id), user_id, {})
2016-09-26 03:52:59 +02:00
@TG_BOT.handle('photo')
2016-09-13 16:17:11 +02:00
async def aiotg_photo(chat, photo):
try:
2016-09-26 03:52:59 +02:00
room_id = TELEGRAM_CHATS[str(chat.id)]
2016-09-13 16:17:11 +02:00
except KeyError:
print('Unknown telegram chat {}'.format(chat))
return
user_id = USER_ID_FORMAT.format(chat.sender['id'])
txn_id = quote('{}:{}'.format(chat.message['message_id'], chat.id))
file_id = photo[-1]['file_id']
uri, mime, length = await upload_tgfile_to_matrix(file_id, user_id)
2016-09-26 03:52:59 +02:00
info = {'mimetype': mime, 'size': length, 'h': photo[-1]['height'],
'w': photo[-1]['width']}
body = 'Image_{}{}'.format(int(time() * 1000),
mimetypes.guess_extension(mime))
2016-09-13 16:17:11 +02:00
if uri:
2016-09-26 03:52:59 +02:00
j = await send_matrix_message(room_id, user_id, txn_id, body=body,
url=uri, info=info, msgtype='m.image')
2016-09-13 16:17:11 +02:00
if 'errcode' in j and j['errcode'] == 'M_FORBIDDEN':
await register_join_matrix(chat, room_id, user_id)
2016-09-26 03:52:59 +02:00
await send_matrix_message(room_id, user_id, txn_id, body=body,
url=uri, info=info, msgtype='m.image')
2016-09-13 16:17:11 +02:00
2016-09-26 03:52:59 +02:00
@TG_BOT.command(r'/alias')
async def aiotg_alias(chat, match):
await chat.reply('The Matrix alias for this chat is #telegram_{}:{}'
.format(chat.id, MATRIX_HOST_BARE))
2016-09-26 03:52:59 +02:00
@TG_BOT.command(r'(?s)(.*)')
2016-09-13 16:17:11 +02:00
async def aiotg_message(chat, match):
link = db.session.query(db.ChatLink).filter_by(tg_room=chat.id).first()
if link:
room_id = link.matrix_room
else:
2016-11-12 02:33:51 +00:00
print('Unknown telegram chat {}: {}'.format(chat, chat.id))
2016-09-13 16:17:11 +02:00
return
user_id = USER_ID_FORMAT.format(chat.sender['id'])
txn_id = quote('{}:{}'.format(chat.message['message_id'], chat.id))
2016-09-13 16:17:11 +02:00
message = match.group(0)
2016-09-26 03:52:59 +02:00
if 'forward_from' in chat.message:
fw_from = chat.message['forward_from']
if 'last_name' in fw_from:
2016-09-26 03:52:59 +02:00
msg_from = '{} {} (Telegram)'.format(fw_from['first_name'],
fw_from['last_name'])
else:
msg_from = '{} (Telegram)'.format(fw_from['first_name'])
quoted_msg = '\n'.join(['>{}'.format(x) for x in message.split('\n')])
2016-11-15 08:28:42 +01:00
quoted_msg = 'Forwarded from {}:\n{}' \
2016-11-15 07:00:00 +00:00
.format(msg_from, quoted_msg)
2016-09-26 03:52:59 +02:00
quoted_html = '<blockquote>{}</blockquote>' \
.format(html.escape(message).replace('\n', '<br />'))
2016-11-15 08:28:42 +01:00
quoted_html = '<i>Forwarded from {}:</i>\n{}' \
2016-11-15 07:00:00 +00:00
.format(html.escape(msg_from), quoted_html)
2016-09-26 03:52:59 +02:00
j = await send_matrix_message(room_id, user_id, txn_id,
body=quoted_msg,
formatted_body=quoted_html,
format='org.matrix.custom.html',
msgtype='m.text')
elif 'reply_to_message' in chat.message:
re_msg = chat.message['reply_to_message']
if 'last_name' in re_msg['from']:
2016-09-26 03:52:59 +02:00
msg_from = '{} {} (Telegram)'.format(re_msg['from']['first_name'],
re_msg['from']['last_name'])
else:
msg_from = '{} (Telegram)'.format(re_msg['from']['first_name'])
2016-09-26 03:52:59 +02:00
date = datetime.fromtimestamp(re_msg['date']) \
2016-11-15 08:28:42 +01:00
.strftime('%Y-%m-%d %H:%M:%S')
2016-09-26 03:52:59 +02:00
quoted_msg = '\n'.join(['>{}'.format(x)
for x in re_msg['text'].split('\n')])
2016-11-15 08:28:42 +01:00
quoted_msg = 'Reply to {} ({}):\n{}\n\n{}' \
2016-09-26 03:52:59 +02:00
.format(msg_from, date, quoted_msg, message)
2016-11-15 08:28:42 +01:00
html_message = html.escape(message).replace('\n', '<br />')
2016-09-26 03:52:59 +02:00
quoted_html = '<blockquote>{}</blockquote>' \
.format(html.escape(re_msg['text'])
.replace('\n', '<br />'))
2016-11-15 08:28:42 +01:00
quoted_html = '<i>Reply to {} ({}):</i><br />{}<p>{}</p>' \
2016-09-26 03:52:59 +02:00
.format(html.escape(msg_from), html.escape(str(date)),
2016-11-15 08:28:42 +01:00
quoted_html, html_message)
2016-09-26 03:52:59 +02:00
j = await send_matrix_message(room_id, user_id, txn_id,
body=quoted_msg,
formatted_body=quoted_html,
format='org.matrix.custom.html',
msgtype='m.text')
else:
2016-09-26 03:52:59 +02:00
j = await send_matrix_message(room_id, user_id, txn_id, body=message,
msgtype='m.text')
2016-09-13 16:17:11 +02:00
if 'errcode' in j and j['errcode'] == 'M_FORBIDDEN':
await asyncio.sleep(0.1)
2016-09-13 16:17:11 +02:00
await register_join_matrix(chat, room_id, user_id)
await asyncio.sleep(0.1)
2016-09-26 03:52:59 +02:00
await send_matrix_message(room_id, user_id, txn_id, body=message,
msgtype='m.text')
2016-09-13 16:17:11 +02:00
2016-09-26 03:52:59 +02:00
def main():
"""
Main function to get the entire ball rolling.
"""
2016-09-13 16:17:11 +02:00
logging.basicConfig(level=logging.WARNING)
db.initialize(DATABASE_URL)
2016-09-13 16:17:11 +02:00
loop = asyncio.get_event_loop()
2016-09-26 03:52:59 +02:00
asyncio.ensure_future(TG_BOT.loop())
2016-09-13 16:17:11 +02:00
app = web.Application(loop=loop)
app.router.add_route('GET', '/rooms/{room_alias}', matrix_room)
2016-09-26 03:52:59 +02:00
app.router.add_route('PUT', '/transactions/{transaction}',
matrix_transaction)
2016-09-13 16:17:11 +02:00
web.run_app(app, port=5000)
2016-09-26 03:52:59 +02:00
if __name__ == "__main__":
main()