"""WWW request handler (also used in the stand-alone server).
"""
__docformat__ = 'restructuredtext'
import base64
import binascii
import codecs
import email.utils
import errno
import logging
import mimetypes
import os
import re
import socket
import stat
import sys
import tempfile
import time
from email.mime.multipart import MIMEMultipart
from traceback import format_exc
try:
from OpenSSL.SSL import SysCallError
except ImportError:
class SysCallError(Exception):
pass
import roundup.anypy.email_ # noqa: F401 -- patches for email library code
from roundup import hyperdb, rest, xmlrpc
# quality of random checked below
from roundup.anypy import http_, random_, urllib_, xmlrpc_
from roundup.anypy.cgi_ import cgi
from roundup.anypy.cookie_ import BaseCookie, CookieError, SimpleCookie, get_cookie_date
from roundup.anypy.html import html_escape
from roundup.anypy.strings import b2s, bs2b, is_us, s2b, uchr
from roundup.cgi import TranslationService, accept_language, actions, cgitb, templating
from roundup.cgi.exceptions import (
DetectorError,
FormError,
IndexerQueryError,
NotFound,
NotModified,
RateLimitExceeded,
Reauth,
Redirect,
SendFile,
SendStaticFile,
SeriousError,
)
from roundup.cgi.form_parser import FormParser
from roundup.exceptions import (
LoginError,
Reject,
RejectRaw,
Unauthorised,
UsageError,
)
from roundup.logcontext import gen_trace_id, store_trace_reason
from roundup.mailer import Mailer, MessageSendError
from roundup.mlink_expr import ExpressionError
logger = logging.getLogger('roundup')
if not random_.is_weak:
logger.debug("Importing good random generator")
else:
logger.warning("**SystemRandom not available. Using poor random generator")
def initialiseSecurity(security):
'''Create some Permissions and Roles on the security object
This function is directly invoked by security.Security.__init__()
as a part of the Security object instantiation.
'''
p = security.addPermission(
name="Web Access",
description="User may access the web interface")
security.addPermissionToRole('Admin', p)
p = security.addPermission(
name="Rest Access",
description="User may access the rest interface")
security.addPermissionToRole('Admin', p)
p = security.addPermission(
name="Xmlrpc Access",
description="User may access the xmlrpc interface")
security.addPermissionToRole('Admin', p)
# doing Role stuff through the web - make sure Admin can
# TODO: deprecate this and use a property-based control
p = security.addPermission(
name="Web Roles",
description="User may manipulate user Roles through the web")
security.addPermissionToRole('Admin', p)
def add_message(msg_list, msg, escape=True):
if escape:
msg = html_escape(msg, quote=False).replace('\n', ' \n')
else:
msg = msg.replace('\n', ' \n')
msg_list.append(msg)
return msg_list # for unittests
# if set to False via interfaces.py do not log a warning when
# xmlrpc is used and defusedxml is not installed.
WARN_FOR_MISSING_DEFUSEDXML = True
default_err_msg = ''"""
An error has occurred
An error has occurred
A problem was encountered processing your request.
The tracker maintainers have been notified of the problem.
"""
def seed_pseudorandom():
'''A function to seed the default pseudorandom random number generator
which is used to (at minimum):
* generate part of email message-id
* generate OTK for password reset
* generate the temp recovery password
This function limits the scope of the 'import random' call
as the random identifier is used throughout the code and
can refer to SystemRandom.
'''
import random
random.seed()
class LiberalCookie(SimpleCookie):
""" Python's SimpleCookie throws an exception if the cookie uses invalid
syntax. Other applications on the same server may have done precisely
this, preventing roundup from working through no fault of roundup.
Numerous other python apps have run into the same problem:
trac: http://trac.edgewall.org/ticket/2256
mailman: http://bugs.python.org/issue472646
This particular implementation comes from trac's solution to the
problem. Unfortunately it requires some hackery in SimpleCookie's
internals to provide a more liberal __set method.
"""
def load(self, rawdata, ignore_parse_errors=True):
if ignore_parse_errors:
self.bad_cookies = []
self._BaseCookie__set = self._loose_set
SimpleCookie.load(self, rawdata)
if ignore_parse_errors:
self._BaseCookie__set = self._strict_set
for key in self.bad_cookies:
del self[key]
_strict_set = BaseCookie._BaseCookie__set
def _loose_set(self, key, real_value, coded_value):
try:
self._strict_set(key, real_value, coded_value)
except CookieError:
self.bad_cookies.append(key)
dict.__setitem__(self, key, None)
class Session:
"""
Needs DB to be already opened by client
Session attributes at instantiation:
- "client" - reference to client for add_cookie function
- "session_db" - session DB manager
- "cookie_name" - name of the cookie with session id
- "_sid" - session id for current user
- "_data" - session data cache
session = Session(client)
session.set(name=value)
value = session.get(name)
session.destroy() # delete current session
session.clean_up() # clean up session table
session.update(set_cookie=True, expire=3600*24*365)
# refresh session expiration time, setting persistent
# cookie if needed to last for 'expire' seconds
"""
def __init__(self, client):
self._data = {}
self._sid = None
self.client = client
self.session_db = client.db.getSessionManager()
# parse cookies for session id
if self.client.secure:
cookie_template = '__Secure-roundup_session_%s'
else:
cookie_template = 'roundup_session_%s'
self.cookie_name = cookie_template % \
re.sub('[^a-zA-Z]', '', client.instance.config.TRACKER_NAME)
cookies = LiberalCookie(client.env.get('HTTP_COOKIE', ''))
if self.cookie_name in cookies:
try:
self._sid = cookies[self.cookie_name].value
self._data = self.session_db.getall(self._sid)
except KeyError:
self._sid = None
# remove old cookie
self.client.add_cookie(self.cookie_name, None)
def _gen_sid(self):
""" generate a unique session key """
while 1:
s = b2s(binascii.b2a_base64(random_.token_bytes(32)).strip()).rstrip('=')
if not self.session_db.exists(s):
break
return s
def clean_up(self):
"""Remove expired sessions"""
self.session_db.clean()
def destroy(self):
self.client.add_cookie(self.cookie_name, None)
self._data = {}
if self._sid:
self.session_db.destroy(self._sid)
self.session_db.commit()
def get(self, name, default=None):
return self._data.get(name, default)
def set(self, **kwargs):
self._data.update(kwargs)
if not self._sid:
self._sid = self._gen_sid()
self.session_db.set(self._sid, **self._data)
# add session cookie
self.update(set_cookie=True)
# XXX added when patching 1.4.4 for backward compatibility
# XXX remove
self.client.session = self._sid
else:
self.session_db.set(self._sid, **self._data)
self.session_db.commit()
def update(self, set_cookie=False, expire=None):
""" update timestamp in db to avoid expiration
if 'set_cookie' is True, set cookie with 'expire' seconds lifetime
if 'expire' is None - session will be closed with the browser
XXX the session can be purged within a week even if a cookie
lifetime is longer
"""
self.session_db.updateTimestamp(self._sid)
self.session_db.commit()
if set_cookie:
self.client.add_cookie(self.cookie_name, self._sid, expire=expire)
# import from object as well so it's a new style object and I can use super()
class BinaryFieldStorage(cgi.FieldStorage, object):
'''This class works around the bug https://bugs.python.org/issue27777.
cgi.FieldStorage must save all data as binary/bytes. This is
needed for handling json and xml data blobs under python
3. Under python 2, str and binary are interchangable, not so
under 3.
'''
def make_file(self, mode=None):
''' work around https://bugs.python.org/issue27777 '''
if self.length >= 0:
return tempfile.TemporaryFile("wb+")
return super(BinaryFieldStorage, self).make_file()
class Client:
"""Instantiate to handle one CGI request.
See inner_main for request processing.
Client attributes at instantiation:
- "path" is the PATH_INFO inside the instance (with no leading '/')
- "base" is the base URL for the instance
- "form" is the cgi form, an instance of FieldStorage from the standard
cgi module
- "additional_headers" is a dictionary of additional HTTP headers that
should be sent to the client
- "response_code" is the HTTP response code to send to the client
- "translator" is TranslationService instance
- "clientnonce" is a unique value for this client connection. Can be
used as a nonce for CSP headers and to sign javascript code
presented to the browser. This is different from the CSRF nonces
and can not be used for anti-csrf measures.
During the processing of a request, the following attributes are used:
- "db"
- "_error_message" holds a list of error messages
- "_ok_message" holds a list of OK messages
- "session" is deprecated in favor of session_api (XXX remove)
- "session_api" is the interface to store data in session
- "user" is the current user's name
- "userid" is the current user's id
- "template" is the current :template context
- "classname" is the current class context name
- "nodeid" is the current context item id
Note: _error_message and _ok_message should not be modified
directly, use add_ok_message and add_error_message, these, by
default, escape the message added to avoid XSS security issues.
User Identification:
Users that are absent in session data are anonymous and are logged
in as that user. This typically gives them all Permissions assigned
to the Anonymous Role.
Every user is assigned a session. "session_api" is the interface
to work with session data.
Special form variables:
Note that in various places throughout this code, special form
variables of the form : are used. The colon (":") part may
actually be one of either ":" or "@".
"""
# charset used for data storage and form templates
# Note: must be in lower case for comparisons!
# XXX take this from instance.config?
STORAGE_CHARSET = 'utf-8'
#
# special form variables
#
FV_TEMPLATE = re.compile(r'[@:]template')
FV_OK_MESSAGE = re.compile(r'[@:]ok_message')
FV_ERROR_MESSAGE = re.compile(r'[@:]error_message')
# Note: index page stuff doesn't appear here:
# columns, sort, sortdir, filter, group, groupdir, search_text,
# pagesize, startwith
# list of network error codes that shouldn't be reported to tracker admin
# (error descriptions from FreeBSD intro(2))
IGNORE_NET_ERRORS = (
# A write on a pipe, socket or FIFO for which there is
# no process to read the data.
errno.EPIPE,
# A connection was forcibly closed by a peer.
# This normally results from a loss of the connection
# on the remote socket due to a timeout or a reboot.
errno.ECONNRESET,
# Software caused connection abort. A connection abort
# was caused internal to your host machine.
errno.ECONNABORTED,
# A connect or send request failed because the connected party
# did not properly respond after a period of time.
errno.ETIMEDOUT,
)
# Cache_Control[key] = Cache-Control header value
# Key can be explicitly file basename - value applied to just that file
# takes precedence over mime type.
# Key can be mime type - all files of that mimetype will get the value
Cache_Control = {
'application/javascript': "public, max-age=1209600", # 2 weeks
'text/javascript': "public, max-age=1209600", # 2 weeks
'text/css': "public, max-age=4838400", # 8 weeks/2 mnths
}
# list of valid http compression (Content-Encoding) algorithms
# we have available
compressors = []
try:
# Only one provided by standard library
import gzip
compressors.append('gzip')
except ImportError:
pass
try:
import brotli
compressors.append('br')
except ImportError:
pass
try:
import zstd
compressors.append('zstd')
except ImportError:
pass
# everything not here is served as 'application/octet-stream'
# Moved to class so it can be modified from interfaces.py
# Adding:
# from roundup.cgi.client import Client
# Client.mime_type_allowlist.append('application/pdf')
# will permit pdf files to be displayed in the browser rather than
# downloaded to a file.
mime_type_allowlist = [
'text/plain',
'text/x-csrc', # .c
'text/x-chdr', # .h
'text/x-patch', # .patch and .diff
'text/x-python', # .py
'text/xml',
'text/csv',
'text/css',
'image/gif',
'image/jpeg',
'image/png',
'image/svg+xml',
'image/webp',
'audio/ogg',
'video/webm',
]
# mime types of files that are already compressed and should not be
# compressed on the fly. Can be extended/reduced using interfaces.py.
# This excludes types from being compressed. Should we have a list
# of mime types we should compress? write_html() calls compress_encode
# which uses this without a content-type so that's an issue.
# Also for text based data, might have charset too so need to parse
# content-type.
precompressed_mime_types = ["image/png", "image/jpeg"]
@gen_trace_id()
@store_trace_reason('client', extract="args[3]['PATH_INFO']")
def __init__(self, instance, request, env, form=None, translator=None):
# re-seed the random number generator. Is this is an instance of
# random.SystemRandom it has no effect.
random_.seed()
# So we also seed the pseudorandom random source obtained from
# import random
# to make sure that every forked copy of the client will return
# new random numbers.
seed_pseudorandom()
self.start = time.time()
self.instance = instance
self.request = request
self.env = env
if translator is not None:
self.setTranslator(translator)
# set self.language to "translator"'s language
try:
self.language = translator.info()["language"]
except (AttributeError, KeyError):
# info() missing or no language key
self.language = ""
else:
self.setTranslator(TranslationService.NullTranslationService())
self.language = "" # as is the default from determine_language
self.mailer = Mailer(instance.config)
# If True the form contents wins over the database contents when
# rendering html properties. This is set when an error occurs so
# that we don't lose submitted form contents.
self.form_wins = False
# save off the path
self.path = env['PATH_INFO']
# this is the base URL for this tracker
self.base = self.instance.config.TRACKER_WEB
# should cookies be secure?
self.secure = self.base.startswith('https')
# check the tracker_web setting
if not self.base.endswith('/'):
self.base = self.base + '/'
# this is the "cookie path" for this tracker (ie. the path part of
# the "base" url)
self.cookie_path = urllib_.urlparse(self.base)[2]
# cookies to set in http responce
# {(path, name): (value, expire)}
self._cookies = {}
# define a unique nonce. Can be used for Content Security Policy
# nonces for scripts.
self.client_nonce = self._gen_nonce()
# see if we need to re-parse the environment for the form (eg Zope)
if form is None:
# cgi.FieldStorage doesn't special case OPTIONS, DELETE or
# PATCH verbs. They are processed like POST. So FieldStorage
# hangs on these verbs trying to read posted data that
# will never arrive.
# If not defined, set CONTENT_LENGTH to 0 so it doesn't
# hang reading the data.
if self.env['REQUEST_METHOD'] in ['OPTIONS', 'DELETE', 'PATCH'] \
and 'CONTENT_LENGTH' not in self.env:
self.env['CONTENT_LENGTH'] = 0
logger.debug("Setting CONTENT_LENGTH to 0 for method: %s",
self.env['REQUEST_METHOD'])
# cgi.FieldStorage must save all data as
# binary/bytes. Subclass BinaryFieldStorage does this.
# It's a workaround for a bug in cgi.FieldStorage. See class
# def for details.
self.form = BinaryFieldStorage(fp=request.rfile, environ=env)
else:
self.form = form
# When the CONTENT-TYPE is not 'application/x-www-form-urlencoded':
# or multipart/*, cgi.(Mini)FieldStorage sets the list property to
# None. Initialize an empty list property in this case so we can
# query the list in all cases.
try:
if (self.form.list is None):
self.form.list = []
except AttributeError:
# self.form should always be some type of
# FieldStorage. If we get an AttributeError,
# print what the form is.
# FIXME: plan on removing this in 2028 to improve
# performance if there are no reports of it being triggered.
logger.error(("Invalid self.form found (please report "
"to the roundup-users mailing list): %s") % self.form)
raise
# turn debugging on/off
try:
self.debug = int(env.get("ROUNDUP_DEBUG", 0))
except ValueError:
# someone gave us a non-int debug level, turn it off
self.debug = 0
# flag to indicate that the HTTP headers have been sent
self.headers_done = 0
# record of headers sent for debugging
self.headers_sent = []
# additional headers to send with the request - must be registered
# before the first write
self.additional_headers = {}
self.response_code = 200
# default character set
self.charset = self.STORAGE_CHARSET
# parse cookies (used for charset lookups)
# use our own LiberalCookie to handle bad apps on the same
# server that have set cookies that are out of spec
self.cookie = LiberalCookie(self.env.get('HTTP_COOKIE', ''))
self.user = None
self.userid = None
self.nodeid = None
self.classname = None
self.template = None
self._ok_message = []
self._error_message = []
def _gen_nonce(self):
""" generate a unique nonce """
return b2s(base64.b32encode(random_.token_bytes(40)))
def setTranslator(self, translator=None):
"""Replace the translation engine
'translator'
is TranslationService instance.
It must define methods 'translate' (TAL-compatible i18n),
'gettext' and 'ngettext' (gettext-compatible i18n).
If omitted, create default TranslationService.
"""
if translator is None:
translator = TranslationService.get_translation(
language=self.instance.config["TRACKER_LANGUAGE"],
tracker_home=self.instance.config["TRACKER_HOME"])
self.translator = translator
self._ = self.gettext = translator.gettext
self.ngettext = translator.ngettext
@gen_trace_id()
@store_trace_reason('client_main', extract="args[0].env['PATH_INFO']")
def main(self):
""" Wrap the real main in a try/finally so we always close off the db.
"""
# strip HTTP_PROXY issue2550925 in case
# PROXY header is set.
if 'HTTP_PROXY' in self.env:
del (self.env['HTTP_PROXY'])
if 'HTTP_PROXY' in os.environ:
del (os.environ['HTTP_PROXY'])
xmlrpc_enabled = self.instance.config.WEB_ENABLE_XMLRPC
rest_enabled = self.instance.config.WEB_ENABLE_REST
try:
if xmlrpc_enabled and self.path == 'xmlrpc':
self.handle_xmlrpc()
elif rest_enabled and (self.path == 'rest' or
self.path[:5] == 'rest/'):
self.handle_rest()
else:
self.inner_main()
finally:
if hasattr(self, 'db'):
self.db.close()
def handle_xmlrpc(self):
if self.env.get('CONTENT_TYPE') != 'text/xml':
self.write(
b"This is the endpoint of Roundup " +
b"XML-RPC interface.")
return
# Pull the raw XML out of the form. The "value" attribute
# will be the raw content of the POST request.
assert self.form.file
input_data = self.form.value
# So that the rest of Roundup can query the form in the
# usual way, we create an empty list of fields.
self.form.list = []
# Set the charset and language, since other parts of
# Roundup may depend upon that.
self.determine_charset()
if self.instance.config["WEB_TRANSLATE_XMLRPC"]:
self.determine_language()
# Open the database as the correct user.
try:
self.determine_user(is_api="xmlrpc")
self.db.tx_Source = "xmlrpc"
self.db.i18n = self.translator
except LoginError as msg:
output = xmlrpc_.client.dumps(
xmlrpc_.client.Fault(401, "%s" % msg),
allow_none=True)
self.setHeader("Content-Type", "text/xml")
self.setHeader("Content-Length", str(len(output)))
self.write(s2b(output))
return
except RateLimitExceeded as msg:
output = xmlrpc_.client.dumps(
xmlrpc_.client.Fault(429, "%s" % msg),
allow_none=True)
self.setHeader("Content-Type", "text/xml")
self.setHeader("Content-Length", str(len(output)))
self.write(s2b(output))
return
if not self.db.security.hasPermission('Xmlrpc Access', self.userid):
output = xmlrpc_.client.dumps(
xmlrpc_.client.Fault(403, "Forbidden"),
allow_none=True)
self.setHeader("Content-Type", "text/xml")
self.setHeader("Content-Length", str(len(output)))
self.write(s2b(output))
return
self.check_anonymous_access()
try:
# coverting from function returning true/false to
# raising exceptions
# Call csrf with xmlrpc checks enabled.
# It will return True if everything is ok,
# raises exception on check failure.
csrf_ok = self.handle_csrf(api=True)
except (Unauthorised, UsageError):
# report exception back to server
exc_type, exc_value, exc_tb = sys.exc_info()
output = xmlrpc_.client.dumps(
xmlrpc_.client.Fault(1, "%s:%s" % (exc_type, exc_value)),
allow_none=True)
csrf_ok = False # we had an error, failed check
if csrf_ok is True:
if WARN_FOR_MISSING_DEFUSEDXML and (not xmlrpc_.client.defusedxml):
logger.warning(self._("XMLRPC endpoint is not using defusedxml. Improve security by installing defusedxml."))
handler = xmlrpc.RoundupDispatcher(self.db,
self.instance.actions,
self.translator,
allow_none=True)
output = handler.dispatch(input_data)
self.setHeader("Content-Type", "text/xml")
self.setHeader("Content-Length", str(len(output)))
self.write(output)
def is_cors_preflight(self):
return (
self.env['REQUEST_METHOD'] == "OPTIONS"
and self.request.headers.get("Access-Control-Request-Method")
# technically Access-Control-Request-Headers (ACRH) is
# optional, but we require the header x-requested-with,
# so ACRH will be present.
and self.request.headers.get("Access-Control-Request-Headers")
and self.request.headers.get("Origin"))
def handle_preflight(self):
# Call rest library to handle the pre-flight request
handler = rest.RestfulInstance(self, self.db)
output = handler.dispatch(self.env['REQUEST_METHOD'],
self.path, self.form)
if self.response_code == 204:
self.write("")
else:
self.setHeader("Content-Length", str(len(output)))
self.write(output)
def reject_request(self, message, message_type="text/plain",
status=http_.client.UNAUTHORIZED):
self.response_code = status
self.setHeader("Content-Length", str(len(message)))
self.setHeader("Content-Type", message_type)
self.write(message)
def handle_rest(self):
# Set the charset and language
self.determine_charset()
if self.instance.config["WEB_TRANSLATE_REST"]:
self.determine_language()
# Open the database as the correct user.
# TODO: add everything to RestfulDispatcher
try:
self.determine_user(is_api="rest")
self.db.tx_Source = "rest"
self.db.i18n = self.translator
except LoginError as err:
output = s2b("Invalid Login - %s" % str(err))
self.reject_request(output, status=http_.client.UNAUTHORIZED)
return
except RateLimitExceeded as err:
output = s2b("%s" % str(err))
self.reject_request(output,
status=http_.client.TOO_MANY_REQUESTS)
return
# Handle CORS preflight request. We know rest is enabled
# because handle_rest is called. Preflight requests
# are unauthenticated, so no need to check permissions.
if (self.is_cors_preflight()):
# Origin header must be defined to get here
if self.is_origin_header_ok(api=True):
self.handle_preflight()
else:
# origin is not authorized for REST
msg = self._("Client is not allowed to use Rest Interface.")
output = s2b(
'{ "error": { "status": 400, "msg": "%s" } }' % msg)
self.reject_request(output,
message_type="application/json",
status=400)
return
if not self.db.security.hasPermission('Rest Access', self.userid):
output = s2b('{ "error": { "status": 403, "msg": "Forbidden." } }')
self.reject_request(output,
message_type="application/json",
status=403)
return
# verify Origin is allowed on all requests including GET.
# If a GET, missing origin is allowed (i.e. same site GET request)
if not self.is_origin_header_ok(api=True):
if 'HTTP_ORIGIN' not in self.env:
msg = self._("Required Header Missing")
err = "REST request missing 'Origin' header by user %(user)s."
else:
msg = self._("Client is not allowed to use Rest Interface.")
err = "REST request 'Origin' (%(origin)s) unauthorized by user %(user)s."
# Use code 400. Codes 401 and 403 imply that authentication
# is needed or authenticated person is not authorized.
output = s2b(
'{ "error": { "status": 400, "msg": "%s" } }' % msg)
self.reject_request(output,
message_type="application/json",
status=400)
# Would be nice to log the original source address here to
# allow firewalling in case of abuse/attack. Especially if
# anonymous is allowed REST access. However,
# self.request.connection.getpeername()
# only gets us 127.0.0.1 when a proxy is used. I think the
# same is true of wsgi mode (but it might be a UNIX domain
# socket address). The upstream server needs to supply the
# real IP as it sees it and we need to consume it. There
# is no method for this that handles all the ways roundup
# can be run AFAIK. So no IP address, just user.
logger.error(err, {"user": self.user,
"origin": self.env.get('HTTP_ORIGIN', None)})
return
self.check_anonymous_access()
try:
# Call csrf with api (xmlrpc, rest) checks enabled.
# It will return True if everything is ok,
# raises exception on check failure.
# Note this returns true for a GET request.
# Must check supplied Origin header for bad value first.
csrf_ok = self.handle_csrf(api=True)
except (Unauthorised, UsageError) as msg:
# FIXME should format return value according to
# client's accept header, so application/xml, text/plain etc..
output = s2b('{ "error": { "status": 400, "msg": "%s"}}' %
str(msg))
self.reject_request(output,
message_type="application/json",
status=400)
csrf_ok = False # we had an error, failed check
return
# With the return above the if will never be false,
# Keeping the if so we can remove return to pass
# output though and format output according to accept
# header.
if csrf_ok is True:
# Call rest library to handle the request
handler = rest.RestfulInstance(self, self.db)
output = handler.dispatch(self.env['REQUEST_METHOD'],
self.path, self.form)
# type header set by rest handler
# self.setHeader("Content-Type", "text/xml")
if self.response_code == 204: # no body with 204
self.write("")
else:
self.setHeader("Content-Length", str(len(output)))
self.write(output)
def add_ok_message(self, msg, escape=True):
add_message(self._ok_message, msg, escape)
def add_error_message(self, msg, escape=True):
add_message(self._error_message, msg, escape)
# Want to interpret form values when rendering when an error
# occurred:
self.form_wins = True
def inner_main(self):
"""Process a request.
The most common requests are handled like so:
1. look for charset and language preferences, set up user locale
see determine_charset, determine_language
2. figure out who we are, defaulting to the "anonymous" user
see determine_user
3. figure out what the request is for - the context
see determine_context
4. handle any requested action (item edit, search, ...)
see handle_action
5. render a template, resulting in HTML output
In some situations, exceptions occur:
- HTTP Redirect (generally raised by an action)
- SendFile (generally raised by determine_context)
serve up a FileClass "content" property
- SendStaticFile (generally raised by determine_context)
serve up a file from the tracker "html" directory
- Unauthorised (generally raised by an action)
the action is cancelled, the request is rendered and an error
message is displayed indicating that permission was not
granted for the action to take place
- templating.Unauthorised (templating action not permitted)
raised by an attempted rendering of a template when the user
doesn't have permission
- NotFound (raised wherever it needs to be)
percolates up to the CGI interface that called the client
"""
self._ok_message = []
self._error_message = []
try:
self.determine_charset()
try:
# make sure we're identified (even anonymously)
self.determine_user()
# figure out the context and desired content template
self.determine_context()
self.determine_language()
self.db.i18n = self.translator
# if we've made it this far the context is to a bit of
# Roundup's real web interface (not a file being served up)
# so do the Anonymous Web Access check now
self.check_anonymous_access()
# check for a valid csrf token identifying the right user
csrf_ok = True
try:
# coverting from function returning true/false to
# raising exceptions
csrf_ok = self.handle_csrf()
except (UsageError, Unauthorised) as msg:
csrf_ok = False
self.form_wins = True
self.add_error_message(' '.join(msg.args))
# If csrf checks pass. Run actions etc.
# handle_action() may handle a form submit action.
# It can change self.classname and self.template,
# and may also append error/ok_messages.
html = self.handle_action() if csrf_ok else None
if html:
self.write_html(html)
return
# now render the page
# we don't want clients caching our dynamic pages
self.additional_headers['Cache-Control'] = 'no-cache'
# pages with messages added expire right now
# simple views may be cached for a small amount of time
# TODO? make page expire time configurable
# always expire pages, as IE just doesn't seem to do the
# right thing here :(
date = time.time() - 1
# if self._error_message or self._ok_message:
# date = time.time() - 1
# else:
# date = time.time() + 5
self.additional_headers['Expires'] = \
email.utils.formatdate(date, usegmt=True)
# render the content
self.write_html(self.renderContext())
except SendFile as designator:
# The call to serve_file may result in an Unauthorised
# exception or a NotModified exception. Those
# exceptions will be handled by the outermost set of
# exception handlers.
self.determine_language()
self.db.i18n = self.translator
# prevent application/octet-stream mime type in header
# from being changed to some other type by the browser
# when mime sniffing.
self.setHeader("X-Content-Type-Options", "nosniff")
# prevent script execution in downloaded SVG, XML files
# (or HTML files if enabled).
self.setHeader("Content-Security-Policy", "script-src 'none'")
self.serve_file(designator)
except SendStaticFile as file:
self.serve_static_file(str(file))
except IOError:
# IOErrors here are due to the client disconnecting before
# receiving the reply.
pass
except SysCallError:
# OpenSSL.SSL.SysCallError is similar to IOError above
pass
except RateLimitExceeded:
raise
except SeriousError as message:
self.write_html(str(message))
except Reauth as e:
self.reauth(e)
except Redirect as url:
# let's redirect - if the url isn't None, then we need to do
# the headers, otherwise the headers have been set before the
# exception was raised
if url:
self.additional_headers['Location'] = str(url)
self.response_code = 302
self.write_html('Redirecting to %s' % (url, url))
except LoginError as message:
# The user tried to log in, but did not provide a valid
# username and password. If we support HTTP
# authorization, send back a response that will cause the
# browser to prompt the user again.
if self.instance.config.WEB_HTTP_AUTH:
self.response_code = http_.client.UNAUTHORIZED
realm = self.instance.config.TRACKER_NAME
self.setHeader("WWW-Authenticate",
'Basic realm="%s"' % realm)
else:
self.response_code = http_.client.FORBIDDEN
self.renderFrontPage(str(message))
except Unauthorised as message:
# users may always see the front page
self.response_code = 403
self.renderFrontPage(str(message))
except NotModified:
# send the 304 response
self.response_code = 304
self.header()
except NotFound as e:
if self.response_code == 400:
# We can't find a parameter (e.g. property name
# incorrect). Tell the user what was raised.
# Do not change to the 404 template since the
# base url is valid just query args are not.
# copy the page format from SeriousError _str_ exception.
error_page = """
Roundup issue tracker: An error has occurred
%s
"""
self.write_html(error_page % str(e))
else:
self.response_code = 404
self.template = '404'
try:
# generates keyerror if class does not exist
self.db.getclass(self.classname)
self.write_html(self.renderContext())
except KeyError:
# we can't map the URL to a class we know about
# reraise the NotFound and let roundup_server
# handle it
raise NotFound(e)
except FormError as e:
self.add_error_message(self._('Form Error: ') + str(e))
self.write_html(self.renderContext())
except RateLimitExceeded as e:
self.add_error_message(str(e))
self.write_html(self.renderContext())
except IOError:
# IOErrors here are due to the client disconnecting before
# receiving the reply.
# may happen during write_html and serve_file, too.
pass
except SysCallError:
# OpenSSL.SSL.SysCallError is similar to IOError above
# may happen during write_html and serve_file, too.
pass
except DetectorError as e:
if not self.instance.config.WEB_DEBUG:
# run when we are not in debug mode, so errors
# go to admin too.
self.send_error_to_admin(e.subject, e.html, e.txt)
self.write_html(e.html)
else:
# in debug mode, only write error to screen.
self.write_html(e.html)
except Exception as e: # noqa: F841
# Something has gone badly wrong. Therefore, we should
# make sure that the response code indicates failure.
if self.response_code == http_.client.OK:
self.response_code = http_.client.INTERNAL_SERVER_ERROR
# Help the administrator work out what went wrong.
html = ("
Traceback
"
+ cgitb.html(i18n=self.translator)
+ ("
Environment Variables
%s
"
% cgitb.niceDict("", self.env)))
if not self.instance.config.WEB_DEBUG:
exc_info = sys.exc_info()
subject = "Error: %s" % exc_info[1]
self.send_error_to_admin(subject, html, format_exc())
self.write_html(self._(default_err_msg))
else:
self.write_html(html)
def clean_sessions(self):
"""Deprecated
XXX remove
"""
self.clean_up()
def clean_up(self):
"""Remove expired sessions and One Time Keys.
Do it only once an hour.
"""
hour = 60 * 60
now = time.time()
# XXX: hack - use OTK table to store last_clean time information
# 'last_clean' string is used instead of otk key
otks = self.db.getOTKManager()
last_clean = otks.get('last_clean', 'last_use', 0)
if now - last_clean < hour:
return
self.session_api.clean_up()
otks.clean()
otks.set('last_clean', last_use=now)
otks.commit()
def determine_charset(self):
"""Look for client charset in the form parameters or browser cookie.
If no charset requested by client, use storage charset (utf-8).
If the charset is found, and differs from the storage charset,
recode all form fields of type 'text/plain'
"""
# look for client charset
charset_parameter = 0
# Python 2.6 form may raise a TypeError if list in form is None
charset = None
try:
charset = self.form['@charset'].value
if charset.lower() == "none":
charset = ""
charset_parameter = 1
except (KeyError, TypeError):
pass
if charset is None and 'roundup_charset' in self.cookie:
charset = self.cookie['roundup_charset'].value
if charset:
# make sure the charset is recognized
try:
codecs.lookup(charset)
except LookupError:
self.add_error_message(self._('Unrecognized charset: %r') %
charset)
charset_parameter = 0
else:
self.charset = charset.lower()
# If we've got a character set in request parameters,
# set the browser cookie to keep the preference.
# This is done after codecs.lookup to make sure
# that we aren't keeping a wrong value.
if charset_parameter:
self.add_cookie('roundup_charset', charset)
# if client charset is different from the storage charset,
# recode form fields
# XXX this requires FieldStorage from Python library.
# mod_python FieldStorage is not supported!
if self.charset != self.STORAGE_CHARSET:
decoder = codecs.getdecoder(self.charset)
encoder = codecs.getencoder(self.STORAGE_CHARSET)
re_charref = re.compile('([0-9]+|x[0-9a-f]+);', re.IGNORECASE)
def _decode_charref(matchobj):
num = matchobj.group(1)
uc = int(num[1:], 16) if num[0].lower() == 'x' else int(num)
return uchr(uc)
for field_name in self.form:
field = self.form[field_name]
if (field.type == 'text/plain') and not field.filename:
try:
value = decoder(field.value)[0]
except UnicodeError:
continue
value = re_charref.sub(_decode_charref, value)
field.value = encoder(value)[0]
def determine_language(self):
"""Determine the language"""
# look for language parameter
# then for language cookie
# last for the Accept-Language header
# Python 2.6 form may raise a TypeError if list in form is None
language = None
try:
language = self.form["@language"].value
if language.lower() == "none":
language = ""
self.add_cookie("roundup_language", language)
except (KeyError, TypeError):
pass
if language is None:
if "roundup_language" in self.cookie:
language = self.cookie["roundup_language"].value
elif self.instance.config["WEB_USE_BROWSER_LANGUAGE"]:
hal = self.env.get('HTTP_ACCEPT_LANGUAGE')
language = accept_language.parse(hal)
else:
language = ""
if not language:
# default to tracker language
language = self.instance.config["TRACKER_LANGUAGE"]
# this maybe is not correct, as get_translation could not
# find desired locale and switch back to "en" but we set
# self.language to the desired language !
self.language = language
self.setTranslator(TranslationService.get_translation(
language,
tracker_home=self.instance.config["TRACKER_HOME"]))
def authenticate_bearer_token(self, challenge):
''' authenticate the bearer token. Refactored from determine_user()
to allow it to be overridden if needed.
'''
try: # will jwt import?
import jwt
except ImportError:
# no support for jwt, this is fine.
self.setHeader("WWW-Authenticate", "Basic")
raise LoginError('Support for jwt disabled.')
# If first ',' separated token is < 32, jwt is disabled.
# If second or later tokens are < 32 chars, the config system
# stops the tracker from starting so insecure tokens can not
# be used.
CHARS_FOR_256_BIT_KEY = 32
if len(self.db.config.WEB_JWT_SECRET[0]) < CHARS_FOR_256_BIT_KEY:
# no support for jwt, this is fine.
self.setHeader("WWW-Authenticate", "Basic")
raise LoginError('Support for jwt disabled by admin.')
last_error = "Unknown error validating bearer token."
for secret in self.db.config.WEB_JWT_SECRET:
try: # handle jwt exceptions
return jwt.decode(challenge, secret,
algorithms=['HS256'],
audience=self.db.config.TRACKER_WEB,
issuer=self.db.config.TRACKER_WEB)
except jwt.exceptions.InvalidSignatureError as err:
# Try more signatures.
# If all signatures generate InvalidSignatureError,
# we exhaust the loop and last_error is used to
# report the final (but not only) InvalidSignatureError
last_error = str(err) # preserve for end of loop
except jwt.exceptions.InvalidTokenError as err:
self.setHeader("WWW-Authenticate", "Basic, Bearer")
self.make_user_anonymous()
raise LoginError(str(err))
# reach here only if no valid signature was found
self.setHeader("WWW-Authenticate", "Basic, Bearer")
self.make_user_anonymous()
raise LoginError(last_error)
def determine_user(self, is_api=False):
"""Determine who the user is"""
self.opendb('admin')
# if we get a jwt, it includes the roles to be used for this session
# so we define a new function to encpsulate and return the jwt roles
# and not take the roles from the database.
override_get_roles = None
# get session data from db
# XXX: rename
self.session_api = Session(self)
# take the opportunity to cleanup expired sessions and otks
self.clean_up()
user = None
# first up, try http authorization if enabled
cfg = self.instance.config
remote_user_header = cfg.WEB_HTTP_AUTH_HEADER or 'REMOTE_USER'
if cfg.WEB_COOKIE_TAKES_PRECEDENCE:
user = self.session_api.get('user')
if user:
# update session lifetime datestamp
self.session_api.update()
if remote_user_header in self.env:
del self.env[remote_user_header]
if not user and cfg.WEB_HTTP_AUTH:
if remote_user_header in self.env:
# we have external auth (e.g. by Apache)
user = self.env[remote_user_header]
if cfg.WEB_HTTP_AUTH_CONVERT_REALM_TO_LOWERCASE and '@' in user:
u, d = user.split('@', 1)
user = '@'.join((u, d.lower()))
elif self.env.get('HTTP_AUTHORIZATION', ''):
# try handling Basic Auth ourselves
auth = self.env['HTTP_AUTHORIZATION']
try:
scheme, challenge = auth.split(' ', 1)
except ValueError:
# Invalid header.
scheme = ''
challenge = ''
if scheme.lower() == 'basic':
try:
decoded = b2s(base64.b64decode(challenge))
except TypeError:
# invalid challenge
decoded = ''
try:
username, password = decoded.split(':', 1)
except ValueError:
# Invalid challenge.
username = ''
password = ''
try:
# Current user may not be None, otherwise
# instatiation of the login action will fail.
# So we set the user to anonymous first.
self.make_user_anonymous()
login = self.get_action_class('login')(self)
login.verifyLogin(username, password, is_api=is_api)
except (LoginError, RateLimitExceeded):
self.make_user_anonymous()
raise
user = username
# try to seed with something harder to guess than
# just the time. If random is SystemRandom,
# this is a no-op.
random_.seed("%s%s" % (password, time.time()))
elif scheme.lower() == 'bearer':
token = self.authenticate_bearer_token(challenge)
from roundup.hyperdb import iter_roles
# if we got here token is valid, use the role
# and sub claims.
try:
# make sure to str(token['sub']) the
# subject. As decoded by json, it is unicode
# which throws an error when used with 'nodeid
# in db' down the call chain.
user = self.db.user.get(str(token['sub']), 'username')
except IndexError:
raise LoginError("Token subject is invalid.")
# validate roles
all_rolenames = [role[0] for role in self.db.security.role.items()]
for r in token['roles']:
if r.lower() not in all_rolenames:
raise LoginError("Token roles are invalid.")
# will be used later to override the get_roles method
# having it defined as truthy allows it to be used.
override_get_roles = lambda self: iter_roles( # noqa: ARG005
','.join(token['roles']))
# if user was not set by http authorization, try session lookup
if not user:
user = self.session_api.get('user')
if user:
# update session lifetime datestamp
self.session_api.update()
# if no user name set by http authorization or session lookup
# the user is anonymous
if not user:
user = 'anonymous'
# sanity check on the user still being valid,
# getting the userid at the same time
try:
self.userid = self.db.user.lookup(user)
except (KeyError, TypeError):
user = 'anonymous'
# make sure the anonymous user is valid if we're using it
if user == 'anonymous':
self.make_user_anonymous()
else:
self.user = user
# reopen the database as the correct user
self.opendb(self.user)
if override_get_roles:
# opendb destroys and re-opens the db if instance.optimize
# is not true. This deletes an override of get_roles. So
# assign get_roles override from the jwt if needed at this
# point.
self.db.user.get_roles = override_get_roles
def check_anonymous_access(self):
"""Check that the Anonymous user is actually allowed to use the web
interface and short-circuit all further processing if they're not.
"""
# allow Anonymous to use the "login" and "register" actions (noting
# that "register" has its own "Register" permission check)
action = ''
try:
if ':action' in self.form:
action = self.form[':action']
elif '@action' in self.form:
action = self.form['@action']
except TypeError:
pass
if isinstance(action, list):
raise SeriousError(
self._('broken form: multiple @action values submitted'))
if action != '':
# '' is value when no action parameter was found so run
# this to extract action string value when action found.
action = action.value.lower()
if action in ('login', 'register'):
return
# allow Anonymous to view the "user" "register" template if they're
# allowed to register
if (self.template == 'register' and self.classname == 'user'
and self.db.security.hasPermission('Register',
self.userid, 'user')):
return
# otherwise for everything else
if self.user == 'anonymous' and \
not self.db.security.hasPermission('Web Access', self.userid):
raise Unauthorised(self._("Anonymous users are not "
"allowed to use the web interface"))
def is_origin_header_ok(self, api=False, credentials=False):
"""Determine if origin is valid for the context
Header is ok (return True) if ORIGIN is missing and it is a GET.
Header is ok if ORIGIN matches the base url.
If this is an API call:
* Header is ok if ORIGIN matches an element of allowed_api_origins.
* Header is ok if allowed_api_origins includes '*' as first
element and credentials is False.
Otherwise header is not ok.
In a credentials context, if we match * we will return
header is not ok. All credentialed requests must be
explicitly matched.
"""
try:
origin = self.env['HTTP_ORIGIN']
except KeyError:
return self.env['REQUEST_METHOD'] == 'GET'
# note base https://host/... ends host with with a /,
# so add it to origin.
foundat = self.base.find(origin + '/')
if foundat == 0:
return True
if not api:
return False
allowed_origins = self.db.config['WEB_ALLOWED_API_ORIGINS']
# find a match for other possible origins
# Original spec says origin is case sensitive match.
# Living spec doesn't address Origin value's case or
# how to compare it. So implement case sensitive....
if origin in allowed_origins:
return True
# Block use of * when origin match is used for
# allowing credentials. See:
# https://developer.mozilla.org/en-US/docs/Web/HTTP/CORS
# under Credentials Requests and Wildcards
return (allowed_origins and allowed_origins[0] == '*'
and not credentials)
def is_referer_header_ok(self, api=False):
referer = self.env['HTTP_REFERER']
# parse referer and create an origin
referer_comp = urllib_.urlparse(referer)
# self.base always has trailing /, so add trailing / to referer_origin
referer_origin = "%s://%s/" % (referer_comp[0], referer_comp[1])
foundat = self.base.find(referer_origin)
if foundat == 0:
return True
if not api:
return False
allowed_origins = self.db.config['WEB_ALLOWED_API_ORIGINS']
if allowed_origins and allowed_origins[0] == '*':
return True
# For referer, loop over allowed_api_origins and
# see if any of them are a prefix to referer, case sensitive.
# Append / to each origin so that:
# an allowed_origin of https://my.host does not match
# a referer of https://my.host.com/my/path
for allowed_origin in allowed_origins:
foundat = referer_origin.find(allowed_origin + '/')
if foundat == 0:
return True
return False
def handle_csrf(self, api=False):
'''Handle csrf token lookup and validate current user and session
This implements (or tries to implement) the
Session-Dependent Nonce from
https://seclab.stanford.edu/websec/csrf/csrf.pdf.
Changing this to an HMAC(sessionid,secret) will
remove the need for saving a fair amount of
state on the server (one nonce per form per
page). If you have multiple forms/page this can
lead to abandoned csrf tokens that have to time
out and get cleaned up. But you lose per form
tokens which may be an advantage. Also the HMAC
is constant for the session, so provides more
occasions for it to be exposed.
This only runs on post (or put and delete for
future use). Nobody should be changing data
with a get.
A session token lifetime is settable in
config.ini. A future enhancement to the
creation routines should allow for the requester
of the token to set the lifetime.
The unique session key and user id is stored
with the token. The token is valid if the stored
values match the current client's userid and
session.
If a user logs out, the csrf keys are
invalidated since no other connection should
have the same session id.
At least to start I am reporting anti-csrf to
the user. If it's an attacker who can see the
site, they can see the @csrf fields and can
probably figure out that he needs to supply
valid headers. Or they can just read this code
8-). So hiding it doesn't seem to help but it
does arguably show the enforcement settings, but
given the newness of this code notifying the
user and having them notify the admins for
debugging seems to be an advantage.
'''
# Create the otks handle here as we need it almost immediately.
# If this is perf issue, set to None here and check below
# once all header checks have passed if it needs to be opened.
otks = self.db.getOTKManager()
# Assume: never allow changes via GET
if self.env['REQUEST_METHOD'] not in ['POST', 'PUT', 'DELETE']:
if (self.form.list is not None) and ("@csrf" in self.form):
# We have a nonce being used with a method it should
# not be. If the nonce exists, report to admin so they
# can fix the nonce leakage and destroy it. (nonces
# used in a get are more exposed than those used in a
# post.) Note, I don't attempt to validate here since
# existence here is the sign of a failure. If nonce
# exists try to report the referer header to try to
# find where this comes from so it can be fixed. If
# nonce doesn't exist just ignore it. Maybe we should
# report, but somebody could spam us with a ton of
# invalid keys and fill up the logs.
if 'HTTP_REFERER' in self.env:
referer = self.env['HTTP_REFERER']
else:
referer = self._("Referer header not available.")
key = self.form['@csrf'].value
if otks.exists(key):
logger.error(
self._("csrf key used with wrong method from: %s"),
referer)
otks.destroy(key)
otks.commit()
# do return here. Keys have been obsoleted.
# we didn't do a expire cycle of session keys,
# but that's ok.
return True
config = self.instance.config
current_user = self.db.getuid()
# List HTTP headers we check. Note that the xmlrpc header is
# missing. Its enforcement is different (yes/required are the
# same for example) so we don't include here.
header_names = [
"ORIGIN",
"REFERER",
"X-FORWARDED-HOST",
"HOST",
]
header_pass = 0 # count of passing header checks
# If required headers are missing, raise an error
for header in header_names:
if (config["WEB_CSRF_ENFORCE_HEADER_%s" % header] == 'required'
and "HTTP_%s" % header.replace('-', '_') not in self.env):
logger.error(self._(
''"csrf header %(header)s required but missing "
''"for user%(userid)s.") % {
'header': header,
'userid': current_user})
raise Unauthorised(self._("Missing header: %s") % header)
# self.base always matches: ^https?://hostname
enforce = config['WEB_CSRF_ENFORCE_HEADER_REFERER']
if 'HTTP_REFERER' in self.env and enforce != "no":
if not self.is_referer_header_ok(api=api):
referer = self.env['HTTP_REFERER']
logmsg = self._(
''"csrf Referer header check failed for user%(userid)s. "
''"Value=%(referer)s") % {'userid': current_user,
'referer': referer}
if enforce in ('required', 'yes'):
logger.error(logmsg)
raise Unauthorised(self._("Invalid Referer: %s") % (
referer))
if enforce == 'logfailure':
logger.warning(logmsg)
else:
header_pass += 1
# if you change these make sure to consider what
# happens if header variable exists but is empty.
# self.base.find("") returns 0 for example not -1
enforce = config['WEB_CSRF_ENFORCE_HEADER_ORIGIN']
if 'HTTP_ORIGIN' in self.env and enforce != "no":
if not self.is_origin_header_ok(api=api):
origin = self.env['HTTP_ORIGIN']
logmsg = self._(
''"csrf Origin header check failed for user%(userid)s. "
''"Value=%(origin)s") % {
'userid': current_user, 'origin': origin}
if enforce in ('required', 'yes'):
logger.error(logmsg)
raise Unauthorised(self._("Invalid Origin %s" % origin))
if enforce == 'logfailure':
logger.warning(logmsg)
else:
header_pass += 1
enforce = config['WEB_CSRF_ENFORCE_HEADER_X-FORWARDED-HOST']
if 'HTTP_X_FORWARDED_HOST' in self.env:
if enforce != "no":
host = self.env['HTTP_X_FORWARDED_HOST']
foundat = self.base.find('://' + host + '/')
# 4 means self.base has http:/ prefix, 5 means https:/ prefix
if foundat not in [4, 5]:
logmsg = self._(
''"csrf X-FORWARDED-HOST header check failed "
''"for user%(userid)s. Value=%(host)s") % {
'userid': current_user, 'host': host}
if enforce in ('required', 'yes'):
logger.error(logmsg)
raise Unauthorised(self._(
"Invalid X-FORWARDED-HOST %s") % host)
if enforce == 'logfailure':
logger.warning(logmsg)
else:
header_pass += 1
else:
# https://seclab.stanford.edu/websec/csrf/csrf.pdf
# recommends checking HTTP HOST header as well.
# If there is an X-FORWARDED-HOST header, check
# that only. The proxy setting X-F-H has probably set
# the host header to a local hostname that is
# internal name of system not name supplied by user.
enforce = config['WEB_CSRF_ENFORCE_HEADER_HOST']
if 'HTTP_HOST' in self.env and enforce != "no":
host = self.env['HTTP_HOST']
foundat = self.base.find('://' + host + '/')
# 4 means http:// prefix, 5 means https:// prefix
if foundat not in [4, 5]:
logmsg = self._(
''"csrf HOST header check failed for "
''"user%(userid)s. Value=%(host)s") % {
'userid': current_user, 'host': host}
if enforce in ('required', 'yes'):
logger.error(logmsg)
raise Unauthorised(self._("Invalid HOST %s") % host)
if enforce == 'logfailure':
logger.warning(logmsg)
else:
header_pass += 1
enforce = config['WEB_CSRF_HEADER_MIN_COUNT']
if header_pass < enforce:
logger.error(self._("Csrf: unable to verify sufficient headers"))
raise UsageError(self._("Unable to verify sufficient headers"))
enforce = config['WEB_CSRF_ENFORCE_HEADER_X-REQUESTED-WITH']
if api and enforce in ['required', 'yes']:
# if we get here we have usually passed at least one
# header check. We check for presence of this custom
# header for xmlrpc/rest calls only.
# E.G. X-Requested-With: XMLHttpRequest
# Note we do not use CSRF nonces for xmlrpc/rest requests.
#
# see: https://www.owasp.org/index.php/Cross-Site_Request_Forgery_(CSRF)_Prevention_Cheat_Sheet#Protecting_REST_Services:_Use_of_Custom_Request_Headers
if 'HTTP_X_REQUESTED_WITH' not in self.env:
logger.error(self._(
''"csrf X-REQUESTED-WITH xmlrpc required header "
''"check failed for user%(userid)s."),
{"userid": current_user})
raise UsageError(self._("Required Header Missing"))
# Expire old csrf tokens now so we don't use them. These will
# be committed after the otks.destroy below. Note that the
# self.clean_up run as part of determine_user() will run only
# once an hour. If we have short lived (e.g. 5 minute) keys
# they will live too long if we depend on clean_up. So we do
# our own.
otks.clean()
if api:
# Save removal of expired keys from database.
otks.commit()
# Return from here since we have done housekeeping
# and don't use csrf tokens for xmlrpc.
return True
# process @csrf tokens past this point.
key = None
nonce_user = None
nonce_session = None
if '@csrf' in self.form:
key = self.form['@csrf'].value
nonce_user = otks.get(key, 'uid', default=None)
nonce_session = otks.get(key, 'sid', default=None)
# The key has been used or compromised.
# Delete it to prevent replay.
otks.destroy(key)
# commit the deletion/expiration of all keys
otks.commit()
enforce = config['WEB_CSRF_ENFORCE_TOKEN']
if key is None: # we do not have an @csrf token
if enforce == 'required':
logger.error(self._(
"Required csrf field missing for user%(userid)s"),
{"userid": current_user})
raise UsageError(self._(
''"We can't validate your session (csrf failure). "
''"Re-enter any unsaved data and try again."))
if enforce == 'logfailure':
# FIXME include url
logger.warning(self._(
"csrf field not supplied by user%(userid)s"),
{"userid": current_user})
else:
# enforce is either yes or no. Both permit change if token is
# missing
return True
current_session = self.session_api._sid
# validate against user and session
if current_user != nonce_user:
logmsg = self._(
''"Csrf mismatch user: current user %(user)s != stored "
''"user %(stored)s, current session, stored session: "
''"%(cur_sess)s,%(stor_sess)s for key %(key)s.") % {
'user': current_user,
'stored': nonce_user,
'cur_sess': current_session,
'stor_sess': nonce_session,
'key': key}
if enforce in ('required', 'yes'):
logger.error(logmsg)
raise UsageError(self._(
''"We can't validate your session (csrf failure). "
''"Re-enter any unsaved data and try again."))
if enforce == 'logfailure':
logger.warning(logmsg)
if current_session != nonce_session:
logmsg = self._(
''"Csrf mismatch user: current session %(curr_sess)s "
''"!= stored session %(stor_sess)s, current user/stored "
''"user is: %(user)s for key %(key)s.") % {
'curr_sess': current_session,
'stor_sess': nonce_session,
'user': current_user,
'key': key}
if enforce in ('required', 'yes'):
logger.error(logmsg)
raise UsageError(self._(
''"We can't validate your session (csrf failure). "
''"Re-enter any unsaved data and try again."))
if enforce == 'logfailure':
logger.warning(logmsg)
# we are done and the change can occur.
return True
def opendb(self, username):
"""Open the database and set the current user.
Opens a database once. On subsequent calls only the user is set on
the database object the instance.optimize is set. If we are in
"Development Mode" (cf. roundup_server) then the database is always
re-opened.
"""
# don't do anything if the db is open and the user has not changed
if hasattr(self, 'db') and self.db.isCurrentUser(username):
return
# open the database or only set the user
if not hasattr(self, 'db'):
self.db = self.instance.open(username)
elif self.instance.optimize:
self.db.setCurrentUser(username)
else:
self.db.close()
self.db = self.instance.open(username)
# The old session API refers to the closed database;
# we can no longer use it.
self.session_api = Session(self)
self.db.tx_Source = "web"
# match designator in URL stripping leading 0's. So:
# https://issues.roundup-tracker.org/issue002551190 is the same as
# https://issues.roundup-tracker.org/issue2551190
# Note: id's are strings not numbers so "02" != "2" but 02 == 2
dre_url = re.compile(r'([^\d]+)0*(\d+)')
def determine_context(self, dre=dre_url):
"""Determine the context of this page from the URL:
The URL path after the instance identifier is examined. The path
is generally only one entry long.
- if there is no path, then we are in the "home" context.
- if the path is "@@file" (or "_file", then the additional
path entry specifies the filename of a static file we're to
serve up from the instance "html" directory. Raises a
SendStaticFile exception.(*)
- if there is something in the path (eg "issue"), it identifies
the tracker class we're to display.
- if the path is an item designator (eg "issue123"), then we're
to display a specific item.
- if the path starts with an item designator and is longer than
one entry, then we're assumed to be handling an item of a
FileClass, and the extra path information gives the filename
that the client is going to label the download with (ie
"file123/image.png" is nicer to download than "file123"). This
raises a SendFile exception.(*)
Both of the "*" types of contexts stop before we bother to
determine the template we're going to use. That's because they
don't actually use templates.
The template used is specified by the :template CGI variable,
which defaults to:
- only classname suplied: "index"
- full item designator supplied: "item"
We set:
self.classname - the class to display, can be None
self.template - the template to render the current context with
self.nodeid - the nodeid of the class we're displaying
"""
# default the optional variables
self.classname = None
self.nodeid = None
# see if a template or messages are specified
template_override = ok_message = error_message = None
try:
keys = self.form.keys()
except TypeError:
keys = ()
for key in keys:
if self.FV_TEMPLATE.match(key):
template_override = self.form[key].value
elif self.FV_OK_MESSAGE.match(key):
ok_message = self.form[key].value
elif self.FV_ERROR_MESSAGE.match(key):
error_message = self.form[key].value
# see if we were passed in a message
if ok_message:
self.add_ok_message(ok_message)
if error_message:
self.add_error_message(error_message)
# determine the classname and possibly nodeid
path = self.path.split('/')
if not path or path[0] in ('', 'home', 'index'):
if template_override is not None:
self.template = template_override
else:
self.template = ''
return
if path[0] in ('@@file', '_file'):
raise SendStaticFile(os.path.join(*path[1:]))
self.classname = path[0]
if len(path) > 1:
# send the file identified by the designator in path[0]
raise SendFile(path[0])
# see if we got a designator
m = dre.match(self.classname)
if m:
self.classname = m.group(1)
self.nodeid = m.group(2)
try:
klass = self.db.getclass(self.classname)
except KeyError:
raise NotFound('%s/%s' % (self.classname, self.nodeid))
if int(self.nodeid) > 2**31:
# Postgres will complain with a ProgrammingError
# if we try to pass in numbers that are too large
raise NotFound('%s/%s' % (self.classname, self.nodeid))
if not klass.hasnode(self.nodeid):
raise NotFound('%s/%s' % (self.classname, self.nodeid))
# with a designator, we default to item view
self.template = 'item'
else:
# with only a class, we default to index view
self.template = 'index'
# make sure the classname is valid
try:
self.db.getclass(self.classname)
except KeyError:
raise NotFound(self.classname)
# see if we have a template override
if template_override is not None:
self.template = template_override
def reauth(self, exception):
"""Processing for a Reauth exception raised from an auditor.
Can be overridden by code in tracker's interfaces.py.
"""
from roundup.anypy.cgi_ import MiniFieldStorage
original_action = self.form['@action'].value if '@action' \
in self.form else ""
original_template = self.template
self.template = 'reauth'
self.form.list = [x for x in self.form.list
if x.name not in ('@action',
'@csrf',
'@template'
)]
# save the action and template used when the Reauth as
# triggered. Will be used to resolve the change by the reauth
# action when when reauth password verified.
if '@next_action' not in self.form.list:
self.form.list.append(MiniFieldStorage('@next_action',
original_action))
if '@next_template' not in self.form.list:
self.form.list.append(MiniFieldStorage('@next_template',
original_template))
if exception.args and "@reauth_message" not in self.form.list:
self.form.list.append(
MiniFieldStorage('@reauth_message',
html_escape(exception.args[0])
)
)
self.write_html(self.renderContext())
# re for splitting designator, see also dre_url above this one
# doesn't strip leading 0's from the id. Why not??
dre = re.compile(r'([^\d]+)(\d+)')
def serve_file(self, designator, dre=dre):
""" Serve the file from the content property of the designated item.
"""
m = dre.match(str(designator))
if not m:
raise NotFound(str(designator))
classname, nodeid = m.group(1), m.group(2)
try:
klass = self.db.getclass(classname)
except KeyError:
# The classname was not valid.
raise NotFound(str(designator))
# perform the Anonymous user access check
self.check_anonymous_access()
# make sure we have the appropriate properties
props = klass.getprops()
if 'type' not in props:
raise NotFound(designator)
if 'content' not in props:
raise NotFound(designator)
# make sure we have permission
if not self.db.security.hasPermission('View', self.userid,
classname, 'content', nodeid):
raise Unauthorised(self._("You are not allowed to view "
"this file."))
# --- mime-type security
# mime type detection is performed in cgi.form_parser
if self.instance.config['WEB_ALLOW_HTML_FILE']:
self.mime_type_allowlist.append('text/html')
try:
mime_type = klass.get(nodeid, 'type')
except IndexError as e:
raise NotFound(e)
# Can happen for msg class:
if not mime_type:
mime_type = 'text/plain'
if mime_type not in self.mime_type_allowlist:
mime_type = 'application/octet-stream'
# --/ mime-type security
# If this object is a file (i.e., an instance of FileClass),
# see if we can find it in the filesystem. If so, we may be
# able to use the more-efficient request.sendfile method of
# sending the file. If not, just get the "content" property
# in the usual way, and use that.
content = None
filename = None
if isinstance(klass, hyperdb.FileClass):
try:
filename = self.db.filename(classname, nodeid)
except AttributeError:
# The database doesn't store files in the filesystem
# and therefore doesn't provide the "filename" method.
pass
except IOError:
# The file does not exist.
pass
if not filename:
content = klass.get(nodeid, 'content')
lmt = klass.get(nodeid, 'activity').timestamp()
self._serve_file(lmt, None, mime_type, content, filename)
def serve_static_file(self, file):
""" Serve up the file named from the templates dir
"""
# figure the filename - try STATIC_FILES, then TEMPLATES dir
for dir_option in ('STATIC_FILES', 'TEMPLATES'):
prefix = self.instance.config[dir_option]
if not prefix:
continue
if is_us(prefix):
# prefix can be a string or list depending on
# option. Make it a list to iterate over.
prefix = [prefix]
for p in prefix:
# if last element of STATIC_FILES ends with '/-',
# or \- on windows, we failed to find the file
# and should not look in TEMPLATES. So raise exception.
if (dir_option == 'STATIC_FILES' and p[-1:] == '-' and
p[-2:-1] in ('/', '\\')):
raise NotFound(file)
# ensure the load doesn't try to poke outside
# of the static files directory
p = os.path.normpath(p)
filename = os.path.normpath(os.path.join(p, file))
if os.path.isfile(filename) and filename.startswith(p):
break # inner loop over list of directories
# reset filename to None as sentinel for use below.
filename = None
# break out of outer loop over options
if filename:
break
if filename is None: # we didn't find a filename
raise NotFound(file)
# detemine meta-type
file = str(file)
mime_type = mimetypes.guess_type(file)[0]
if not mime_type:
mime_type = 'text/css' if file.endswith('.css') else 'text/plain'
# get filename: given a/b/c.js extract c.js
fn = file.rpartition("/")[2]
if fn in self.Cache_Control:
# if filename matches, don't use cache control
# for mime type.
self.additional_headers['Cache-Control'] = \
self.Cache_Control[fn]
elif mime_type in self.Cache_Control:
self.additional_headers['Cache-Control'] = \
self.Cache_Control[mime_type]
self._serve_file(None, None, mime_type, '', filename)
def _serve_file(self, lmt, etag, mime_type, content=None, filename=None):
"""guts of serve_file() and serve_static_file()
if lmt or etag are None, derive them from file filename.
Handles if-modified-since and if-none-match etag
conditional gets.
It produces an raw etag header without encoding suffix.
But it adds Accept-Encoding to the vary header.
"""
if filename:
stat_info = os.stat(filename)
if lmt is None:
# last-modified time
lmt = stat_info[stat.ST_MTIME]
if etag is None:
# FIXME: maybe etag should depend on encoding.
# it is an apache compatible etag without encoding.
etag = '"%x-%x-%x"' % (stat_info[stat.ST_INO],
stat_info[stat.ST_SIZE],
stat_info[stat.ST_MTIME])
# spit out headers for conditional request
self.setHeader("ETag", etag)
self.additional_headers['Last-Modified'] = \
email.utils.formatdate(lmt, usegmt=True)
inm = None
# ETag is a more strict check than modified date. Use etag
# check if available. Skip testing modified data.
if hasattr(self.request, 'headers'):
inm = self.request.headers.get('if-none-match')
elif 'HTTP_IF_NONE_MATCH' in self.env:
# maybe the cgi will put the header in the env var
inm = self.env['HTTP_IF_NONE_MATCH']
if inm and etag == inm:
# because we can compress, always set Accept-Encoding
# value. Otherwise caches can serve up the wrong info
# if their cached copy has no compression.
self.setVary("Accept-Encoding")
'''
to solve issue2551356 I may need to determine
the content encoding.
if (self.determine_content_encoding()):
'''
raise NotModified
if self.if_not_modified_since(lmt):
# because we can compress, always set Accept-Encoding
# value. Otherwise caches can serve up the wrong info
# if their cached copy has no compression.
self.setVary("Accept-Encoding")
'''
to solve issue2551356 I may need to determine
the content encoding.
if (self.determine_content_encoding()):
'''
raise NotModified
# don't set until we are sure we are sending a response body.
self.additional_headers['Content-Type'] = mime_type
if filename:
self.write_file(filename)
else:
self.additional_headers['Content-Length'] = str(len(content))
self.write(content)
def if_not_modified_since(self, lmt):
ims = None
# see if there's an if-modified-since...
if hasattr(self.request, 'headers'):
ims = self.request.headers.get('if-modified-since')
elif 'HTTP_IF_MODIFIED_SINCE' in self.env:
# cgi will put the header in the env var
ims = self.env['HTTP_IF_MODIFIED_SINCE']
if ims:
datestamp = email.utils.parsedate(ims)
if datestamp is not None:
ims = datestamp[:6]
else:
# set to beginning of time so whole file will be sent
ims = (0, 0, 0, 0, 0, 0)
lmtt = time.gmtime(lmt)[:6]
return lmtt <= ims
return False
def send_error_to_admin(self, subject, html, txt):
"""Send traceback information to admin via email.
We send both, the formatted html (with more information) and
the text version of the traceback. We use
multipart/alternative so the receiver can chose which version
to display.
"""
to = [self.mailer.config.ADMIN_EMAIL]
message = MIMEMultipart('alternative')
self.mailer.set_message_attributes(message, to, subject)
part = self.mailer.get_text_message('utf-8', 'html')
part.set_payload(html, part.get_charset())
message.attach(part)
part = self.mailer.get_text_message()
part.set_payload(txt, part.get_charset())
message.attach(part)
self.mailer.smtp_send(to, message.as_string())
def renderFrontPage(self, message):
"""Return the front page of the tracker."""
self.classname = self.nodeid = None
self.template = ''
self.add_error_message(message)
self.write_html(self.renderContext())
def selectTemplate(self, name, view):
""" Choose existing template for the given combination of
classname (name parameter) and template request variable
(view parameter) and return its name.
View can be a single template or two templates separated
by a vbar '|' character. If the Client object has a
non-empty _error_message attribute, the right hand
template (error template) will be used. If the
_error_message is empty, the left hand template (ok
template) will be used.
In most cases the name will be "classname.view", but
if "view" is None, then template name "classname" will
be returned.
If "classname.view" template doesn't exist, the
"_generic.view" is used as a fallback.
[ ] cover with tests
"""
# determine if view is oktmpl|errortmpl. If so assign the
# right one to the view parameter. If we don't have alternate
# templates, just leave view alone.
if (view and view.find('|') != -1):
# we have alternate templates, parse them apart.
(oktmpl, errortmpl) = view.split("|", 1)
# Choose the right template
view = errortmpl if self._error_message else oktmpl
loader = self.instance.templates
# if classname is not set, use "home" template
if name is None:
name = 'home'
tplname = name
if view:
# Support subdirectories for templates. Value is path/to/VIEW
# or just VIEW if the template is in the html directory of
# the tracker.
slash_loc = view.rfind("/")
if slash_loc == -1:
# try plain class.view
tplname = '%s.%s' % (name, view)
else:
# try path/class.view
tplname = '%s/%s.%s' % (
view[:slash_loc], name, view[slash_loc + 1:])
if loader.check(tplname):
return tplname
# rendering class/context with generic template for this view.
# with no view it's impossible to choose which generic template to use
if not view:
raise templating.NoTemplate('Template "%s" doesn\'t exist' % name)
if slash_loc == -1:
generic = '_generic.%s' % view
else:
generic = '%s/_generic.%s' % (view[:slash_loc], view[slash_loc + 1:])
if loader.check(generic):
return generic
raise templating.NoTemplate(
'No template file exists for templating '
'"%s" with template "%s" (neither "%s" nor "%s")' % (
name, view, tplname, generic))
def renderContext(self):
""" Return a PageTemplate for the named page
"""
try:
tplname = self.selectTemplate(self.classname, self.template)
# catch errors so we can handle PT rendering errors more nicely
args = {
'ok_message': self._ok_message,
'error_message': self._error_message,
}
pt = self.instance.templates.load(tplname)
# let the template render figure stuff out
try:
result = pt.render(self, None, None, **args)
except IndexerQueryError as e:
result = self.renderError(e.args[0])
except ExpressionError as e:
self.add_error_message(str(e))
self.template = "search"
result = self.renderContext()
if 'Content-Type' not in self.additional_headers:
self.additional_headers['Content-Type'] = pt.content_type
if self.env.get('CGI_SHOW_TIMING', ''):
if self.env['CGI_SHOW_TIMING'].upper() == 'COMMENT':
timings = {'starttag': ''}
else:
timings = {'starttag': '