mirror of
https://git.notmuchmail.org/git/notmuch
synced 2024-11-24 20:08:10 +01:00
3a311ed5ec
Originally contributed by Brian Sniffen [1]. Quite a few unpublished fixes from Daniel Kahn Gilmour. We've been running it a few years now as the "official" archive of the notmuch mailing list. There also a few fixes from myself and Austin Ray. Finally I converted it to the new python bindings. This commit squashes the several years of development history and moves it under devel, in recognition of the now established role it plays in the project infrastructure. [1]: id:87tvyvp4f2.fsf@istari.evenmere.org
366 lines
12 KiB
Python
Executable file
366 lines
12 KiB
Python
Executable file
#!/usr/bin/env python
|
|
|
|
from __future__ import absolute_import
|
|
|
|
try:
|
|
from urllib.parse import quote_plus
|
|
from urllib.parse import unquote_plus
|
|
except ImportError:
|
|
from urllib import quote_plus
|
|
from urllib import unquote_plus
|
|
|
|
from datetime import datetime
|
|
from mailbox import MaildirMessage
|
|
import mimetypes
|
|
import email
|
|
import re
|
|
import html
|
|
import os
|
|
|
|
import bleach
|
|
import web
|
|
from notmuch2 import Database
|
|
from jinja2 import Environment, FileSystemLoader # FIXME to PackageLoader
|
|
from jinja2 import Markup
|
|
try:
|
|
import bjoern # from https://github.com/jonashaag/bjoern/
|
|
use_bjoern = True
|
|
except:
|
|
use_bjoern = False
|
|
|
|
# Configuration options
|
|
safe_tags = bleach.sanitizer.ALLOWED_TAGS + \
|
|
[u'div', u'span', u'p', u'br', u'table', u'tr', u'td', u'th']
|
|
linkify_plaintext = True # delays page load by about 0.02s of 0.20s budget
|
|
show_thread_nav = True # delays page load by about 0.04s of 0.20s budget
|
|
|
|
prefix = os.environ.get('NMWEB_PREFIX', "http://localhost:8080")
|
|
webprefix = os.environ.get('NMWEB_STATIC', prefix + "/static")
|
|
cachedir = os.environ.get('NMWEB_CACHE', "static/cache") # special for webpy server; changeable if using your own
|
|
cachepath = os.environ.get('NMWEB_CACHE_PATH', cachedir) # location of static cache in the local filesystem
|
|
|
|
if 'NMWEB_DEBUG' in os.environ:
|
|
web.config.debug = True
|
|
else:
|
|
web.config.debug = False
|
|
|
|
# End of config options
|
|
|
|
env = Environment(autoescape=True,
|
|
loader=FileSystemLoader('templates'))
|
|
|
|
urls = (
|
|
'/', 'index',
|
|
'/search/(.*)', 'search',
|
|
'/show/(.*)', 'show',
|
|
)
|
|
|
|
def urlencode_filter(s):
|
|
if type(s) == 'Markup':
|
|
s = s.unescape()
|
|
s = s.encode('utf8')
|
|
s = quote_plus(s)
|
|
return Markup(s)
|
|
env.filters['url'] = urlencode_filter
|
|
|
|
class index:
|
|
def GET(self):
|
|
web.header('Content-type', 'text/html')
|
|
base = env.get_template('base.html')
|
|
template = env.get_template('index.html')
|
|
db = Database()
|
|
tags = db.tags
|
|
return template.render(tags=tags,
|
|
title="Notmuch webmail",
|
|
prefix=prefix,
|
|
sprefix=webprefix)
|
|
|
|
class search:
|
|
def GET(self, terms):
|
|
redir = False
|
|
if web.input(terms=None).terms:
|
|
redir = True
|
|
terms = web.input().terms
|
|
terms = unquote_plus (terms)
|
|
if web.input(afters=None).afters:
|
|
afters = web.input(afters=None).afters[:-3]
|
|
else:
|
|
afters = '0'
|
|
if web.input(befores=None).befores:
|
|
befores = web.input(befores=None).befores
|
|
else:
|
|
befores = '4294967296' # 2^32
|
|
try:
|
|
if int(afters) > 0 or int(befores) < 4294967296:
|
|
redir = True
|
|
terms += ' date:@%s..@%s' % (int(afters), int(befores))
|
|
except ValueError:
|
|
pass
|
|
if redir:
|
|
raise web.seeother('/search/%s' % quote_plus(terms.encode('utf8')))
|
|
web.header('Content-type', 'text/html')
|
|
db = Database()
|
|
ts = db.threads(query=terms, sort=Database.SORT.NEWEST_FIRST)
|
|
template = env.get_template('search.html')
|
|
return template.generate(terms=terms,
|
|
ts=ts,
|
|
title=terms,
|
|
prefix=prefix,
|
|
sprefix=webprefix)
|
|
|
|
def format_time_range(start, end):
|
|
if end-start < (60*60*24):
|
|
time = datetime.fromtimestamp(start).strftime('%Y %b %d %H:%M')
|
|
else:
|
|
start = datetime.fromtimestamp(start).strftime("%Y %b %d")
|
|
end = datetime.fromtimestamp(end).strftime("%Y %b %d")
|
|
time = "%s through %s" % (start, end)
|
|
return time
|
|
env.globals['format_time_range'] = format_time_range
|
|
|
|
def mailto_addrs(msg,header_name):
|
|
try:
|
|
hdr = msg.header(header_name)
|
|
except LookupError:
|
|
return ''
|
|
|
|
frm = email.utils.getaddresses([hdr])
|
|
return ','.join(['<a href="mailto:%s">%s</a> ' % ((l, p) if p else (l, l)) for (p, l) in frm])
|
|
env.globals['mailto_addrs'] = mailto_addrs
|
|
|
|
def link_msg(msg):
|
|
lnk = quote_plus(msg.messageid.encode('utf8'))
|
|
try:
|
|
subj = msg.header('Subject')
|
|
except LookupError:
|
|
subj = ""
|
|
out = '<a href="%s/show/%s">%s</a>' % (prefix, lnk, subj)
|
|
return out
|
|
env.globals['link_msg'] = link_msg
|
|
|
|
def show_msgs(msgs):
|
|
r = '<ul>'
|
|
for msg in msgs:
|
|
red = 'color:black; font-style:normal'
|
|
if msg.matched:
|
|
red = 'color:red; font-style:italic'
|
|
frm = mailto_addrs(msg,'From')
|
|
lnk = link_msg(msg)
|
|
tags = ", ".join(msg.tags)
|
|
rs = show_msgs(msg.replies())
|
|
r += '<li><span style="%s">%s—%s</span> [%s] %s</li>' % (red, frm, lnk, tags, rs)
|
|
r += '</ul>'
|
|
return r
|
|
env.globals['show_msgs'] = show_msgs
|
|
|
|
# As email.message.walk, but showing close tags as well
|
|
def mywalk(self):
|
|
yield self
|
|
if self.is_multipart():
|
|
for subpart in self.get_payload():
|
|
for subsubpart in mywalk(subpart):
|
|
yield subsubpart
|
|
yield 'close-div'
|
|
|
|
class show:
|
|
def GET(self, mid):
|
|
web.header('Content-type', 'text/html')
|
|
db = Database()
|
|
try:
|
|
m = db.find(mid)
|
|
except:
|
|
raise web.notfound("No such message id.")
|
|
template = env.get_template('show.html')
|
|
# FIXME add reply-all link with email.urils.getaddresses
|
|
# FIXME add forward link using mailto with body parameter?
|
|
return template.render(m=m,
|
|
mid=mid,
|
|
title=m.header('Subject'),
|
|
prefix=prefix,
|
|
sprefix=webprefix)
|
|
|
|
def thread_nav(m):
|
|
if not show_thread_nav: return
|
|
db = Database()
|
|
thread = next(db.threads('thread:'+m.threadid))
|
|
prv = None
|
|
found = False
|
|
nxt = None
|
|
for msg in thread:
|
|
if m == msg:
|
|
found = True
|
|
elif not found:
|
|
prv = msg
|
|
else: # found message, but not on this loop
|
|
nxt = msg
|
|
break
|
|
yield "<hr><ul>"
|
|
if prv: yield "<li>Previous message (by thread): %s</li>" % link_msg(prv)
|
|
if nxt: yield "<li>Next message (by thread): %s</li>" % link_msg(nxt)
|
|
yield "</ul><h3>Thread:</h3>"
|
|
# FIXME show now takes three queries instead of 1;
|
|
# can we yield the message body while computing the thread shape?
|
|
thread = next(db.threads('thread:'+m.threadid))
|
|
yield show_msgs(thread.toplevel())
|
|
return
|
|
env.globals['thread_nav'] = thread_nav
|
|
|
|
def format_message(nm_msg, mid):
|
|
fn = list(nm_msg.filenames())[0]
|
|
msg = MaildirMessage(open(fn))
|
|
return format_message_walk(msg, mid)
|
|
|
|
def decodeAnyway(txt, charset='ascii'):
|
|
try:
|
|
out = txt.decode(charset)
|
|
except:
|
|
try:
|
|
out = txt.decode('utf-8')
|
|
except UnicodeDecodeError:
|
|
out = txt.decode('latin1')
|
|
return out
|
|
|
|
def require_protocol_prefix(attrs, new=False):
|
|
if not new:
|
|
return attrs
|
|
link_text = attrs[u'_text']
|
|
if link_text.startswith(('http:', 'https:', 'mailto:', 'git:', 'id:')):
|
|
return attrs
|
|
return None
|
|
|
|
# Bleach doesn't even try to linkify id:... text, so no point invoking this yet
|
|
def modify_id_links(attrs, new=False):
|
|
if attrs[(None, u'href')].startswith(u'id:'):
|
|
attrs[(None, u'href')] = prefix + "/show/" + attrs[(None, u'href')][3:]
|
|
return attrs
|
|
|
|
def css_part_id(content_type, parts=[]):
|
|
c = content_type.replace('/', '-')
|
|
out = "-".join(parts + [c])
|
|
return out
|
|
|
|
def format_message_walk(msg, mid):
|
|
counter = 0
|
|
cid_refd = []
|
|
parts = ['main']
|
|
for part in mywalk(msg):
|
|
if part == 'close-div':
|
|
parts.pop()
|
|
yield '</div>'
|
|
elif part.get_content_maintype() == 'multipart':
|
|
yield '<div class="multipart-%s" id="%s">' % \
|
|
(part.get_content_subtype(), css_part_id(part.get_content_type(), parts))
|
|
parts.append(part.get_content_subtype())
|
|
if part.get_content_subtype() == 'alternative':
|
|
yield '<ul>'
|
|
for subpart in part.get_payload():
|
|
yield ('<li><a href="#%s">%s</a></li>' %
|
|
(css_part_id(subpart.get_content_type(), parts),
|
|
subpart.get_content_type()))
|
|
yield '</ul>'
|
|
elif part.get_content_type() == 'message/rfc822':
|
|
# FIXME extract subject, date, to/cc/from into a separate template and use it here
|
|
yield '<div class="message-rfc822">'
|
|
elif part.get_content_maintype() == 'text':
|
|
if part.get_content_subtype() == 'plain':
|
|
yield '<div id="%s">' % css_part_id(part.get_content_type(), parts)
|
|
yield '<pre>'
|
|
out = part.get_payload(decode=True)
|
|
out = decodeAnyway(out, part.get_content_charset('ascii'))
|
|
out = html.escape(out)
|
|
out = out.encode('ascii', 'xmlcharrefreplace').decode('ascii')
|
|
if linkify_plaintext: out = bleach.linkify(out, callbacks=[require_protocol_prefix])
|
|
yield out
|
|
yield '</pre></div>'
|
|
elif part.get_content_subtype() == 'html':
|
|
yield '<div id="%s">' % css_part_id(part.get_content_type(), parts)
|
|
unb64 = part.get_payload(decode=True)
|
|
decoded = decodeAnyway(unb64, part.get_content_charset('ascii'))
|
|
cid_refd += find_cids(decoded)
|
|
part.set_payload(bleach.clean(replace_cids(decoded, mid), tags=safe_tags).
|
|
encode(part.get_content_charset('ascii'), 'xmlcharrefreplace'))
|
|
(filename, cid) = link_to_cached_file(part, mid, counter)
|
|
counter += 1
|
|
yield '<iframe class="embedded-html" src="%s"></iframe>' % \
|
|
os.path.join(prefix, cachedir, mid, filename)
|
|
yield '</div>'
|
|
else:
|
|
yield '<div id="%s">' % css_part_id(part.get_content_type(), parts)
|
|
(filename, cid) = link_to_cached_file(part, mid, counter)
|
|
counter += 1
|
|
yield '<a href="%s">%s (%s)</a>' % (os.path.join(prefix,
|
|
cachedir,
|
|
mid,
|
|
filename),
|
|
filename,
|
|
part.get_content_type())
|
|
yield '</div>'
|
|
elif part.get_content_maintype() == 'image':
|
|
(filename, cid) = link_to_cached_file(part, mid, counter)
|
|
if cid not in cid_refd:
|
|
counter += 1
|
|
yield '<img src="%s" alt="%s">' % (os.path.join(prefix,
|
|
cachedir,
|
|
mid,
|
|
filename),
|
|
filename)
|
|
else:
|
|
(filename, cid) = link_to_cached_file(part, mid, counter)
|
|
counter += 1
|
|
yield '<a href="%s">%s (%s)</a>' % (os.path.join(prefix,
|
|
cachedir,
|
|
mid,
|
|
filename),
|
|
filename,
|
|
part.get_content_type())
|
|
env.globals['format_message'] = format_message
|
|
|
|
def replace_cids(body, mid):
|
|
return body.replace('cid:', os.path.join(prefix, cachedir, mid)+'/')
|
|
|
|
def find_cids(body):
|
|
return re.findall(r'cid:([^ "\'>]*)', body)
|
|
|
|
def link_to_cached_file(part, mid, counter):
|
|
filename = part.get_filename()
|
|
if not filename:
|
|
ext = mimetypes.guess_extension(part.get_content_type())
|
|
if not ext:
|
|
ext = '.bin'
|
|
filename = 'part-%03d%s' % (counter, ext)
|
|
try:
|
|
os.makedirs(os.path.join(cachepath, mid))
|
|
except OSError:
|
|
pass
|
|
fn = os.path.join(cachepath, mid, filename) # FIXME escape mid, filename
|
|
fp = open(fn, 'wb')
|
|
if part.get_content_maintype() == 'text':
|
|
data = part.get_payload(decode=True)
|
|
data = decodeAnyway(data, part.get_content_charset('ascii')).encode('utf-8')
|
|
else:
|
|
try:
|
|
data = part.get_payload(decode=True)
|
|
except:
|
|
data = part.get_payload(decode=False)
|
|
if data:
|
|
fp.write(data)
|
|
fp.close()
|
|
if 'Content-ID' in part:
|
|
cid = part['Content-ID']
|
|
if cid[0] == '<' and cid[-1] == '>': cid = cid[1:-1]
|
|
cid_fn = os.path.join(cachepath, mid, cid) # FIXME escape mid, cid
|
|
try:
|
|
os.unlink(cid_fn)
|
|
except OSError:
|
|
pass
|
|
os.link(fn, cid_fn)
|
|
return (filename, cid)
|
|
else:
|
|
return (filename, None)
|
|
|
|
if __name__ == '__main__':
|
|
app = web.application(urls, globals())
|
|
if use_bjoern:
|
|
bjoern.run(app.wsgifunc(), "127.0.0.1", 8080)
|
|
else:
|
|
app.run()
|