Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

add brotli support #3235

Open
wants to merge 2 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Jump to
Jump to file
Failed to load files.
Diff view
Diff view
6 changes: 6 additions & 0 deletions setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -119,5 +119,11 @@ def get_tag(self):
"Programming Language :: Python :: Implementation :: CPython",
"Programming Language :: Python :: Implementation :: PyPy",
],
extras_require={
"brotli": [
"brotli; platform_python_implementation == 'CPython'",
"brotlicffi; platform_python_implementation != 'CPython'",
]
},
**kwargs
)
223 changes: 162 additions & 61 deletions tornado/web.py
Original file line number Diff line number Diff line change
Expand Up @@ -112,18 +112,20 @@ async def main():
url = URLSpec

from typing import (
Dict,
Any,
Union,
Optional,
Awaitable,
Tuple,
List,
Callable,
Iterable,
Dict,
FrozenSet,
Generator,
Iterable,
List,
MutableSequence,
Optional,
Tuple,
Type,
TypeVar,
Union,
cast,
overload,
)
Expand Down Expand Up @@ -2101,13 +2103,19 @@ def __init__(
self,
handlers: Optional[_RuleList] = None,
default_host: Optional[str] = None,
transforms: Optional[List[Type["OutputTransform"]]] = None,
transforms: Optional[
MutableSequence[Callable[[httputil.HTTPServerRequest], "OutputTransform"]]
] = None,
**settings: Any,
) -> None:
if transforms is None:
self.transforms = [] # type: List[Type[OutputTransform]]
if settings.get("compress_response") or settings.get("gzip"):
self.transforms.append(GZipContentEncoding)
self.transforms = (
[]
) # type: MutableSequence[Callable[[httputil.HTTPServerRequest], OutputTransform]]
if settings.get("compress_response"):
self.transforms = [CompressingOutputTransform]
elif settings.get("gzip"):
self.transforms = [GZipContentEncoding]
else:
self.transforms = transforms
self.default_host = default_host
Expand Down Expand Up @@ -3138,43 +3146,44 @@ def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
return chunk


class GZipContentEncoding(OutputTransform):
"""Applies the gzip content encoding to the response.

See http://www.w3.org/Protocols/rfc2616/rfc2616-sec14.html#sec14.11

.. versionchanged:: 4.0
Now compresses all mime types beginning with ``text/``, instead
of just a whitelist. (the whitelist is still used for certain
non-text mime types).
"""
class _CompressingOutputTransformABC(OutputTransform):
"""ABC for classes that compress outputs."""

# Whitelist of compressible mime types (in addition to any types
# beginning with "text/").
CONTENT_TYPES = set(
[
"application/javascript",
"application/x-javascript",
"application/xml",
"application/atom+xml",
"application/json",
"application/xhtml+xml",
"image/svg+xml",
]
)
# Python's GzipFile defaults to level 9, while most other gzip
# tools (including gzip itself) default to 6, which is probably a
# better CPU/size tradeoff.
GZIP_LEVEL = 6
CONTENT_TYPES = {
"application/javascript",
"application/x-javascript",
"application/xml",
"application/atom+xml",
"application/json",
"application/xhtml+xml",
"image/svg+xml",
}
# Responses that are too short are unlikely to benefit from compression
# after considering the added "Content-Encoding" header and the framing
# overhead of the compressed stream itself (e.g. the gzip header).
# Note that responses written in multiple chunks will be compressed
# regardless of size.
MIN_LENGTH = 1024

CONTENT_ENCODING: str = ""
"""The encoding used, in sub-classes it will be equal to CONTENT_ENCODING."""

_compressing: bool
"""If this is False the output will not be transformed."""

@staticmethod
def accepted_encodings(request: httputil.HTTPServerRequest) -> "FrozenSet[str]":
    """Return the content codings listed in the request's ``Accept-Encoding``.

    The header is lower-cased and split on commas.  Any parameters after
    a ``;`` (in practice the ``q`` weight) are stripped, so
    ``"gzip;q=0.8"`` yields ``"gzip"``.  A coding whose weight parses as
    zero (``q=0``) is omitted because the client has explicitly refused
    it.  Empty list items are ignored, so a missing or empty header
    produces an empty set.

    The wildcard ``*`` is returned verbatim if present; it is not
    expanded here.

    :arg request: the request whose headers are inspected.
    :returns: the set of acceptable coding names, lower-cased.
    """
    accepted = set()
    header = request.headers.get("Accept-Encoding", "")
    for item in header.lower().split(","):
        coding, _, params = item.partition(";")
        coding = coding.strip()
        if not coding:
            continue
        refused = False
        for param in params.split(";"):
            key, _, value = param.partition("=")
            if key.strip() != "q":
                continue
            try:
                refused = float(value) <= 0
            except ValueError:
                # A malformed weight is treated as "no weight given"
                # rather than as a refusal.
                refused = False
        if not refused:
            accepted.add(coding)
    return frozenset(accepted)

def __init__(self, request: httputil.HTTPServerRequest) -> None:
self._gzipping = "gzip" in request.headers.get("Accept-Encoding", "")
super().__init__(request)
self._compressing = self.CONTENT_ENCODING in self.accepted_encodings(request)

def _compressible_type(self, ctype: str) -> bool:
return ctype.startswith("text/") or ctype in self.CONTENT_TYPES
Expand All @@ -3186,38 +3195,74 @@ def transform_first_chunk(
chunk: bytes,
finishing: bool,
) -> Tuple[int, httputil.HTTPHeaders, bytes]:
# TODO: can/should this type be inherited from the superclass?
if "Vary" in headers:
headers["Vary"] += ", Accept-Encoding"
else:
headers["Vary"] = "Accept-Encoding"
if self._gzipping:
ctype = _unicode(headers.get("Content-Type", "")).split(";")[0]
self._gzipping = (
self._compressible_type(ctype)
and (not finishing or len(chunk) >= self.MIN_LENGTH)
and ("Content-Encoding" not in headers)
)
if self._gzipping:
headers["Content-Encoding"] = "gzip"
self._gzip_value = BytesIO()
self._gzip_file = gzip.GzipFile(
mode="w", fileobj=self._gzip_value, compresslevel=self.GZIP_LEVEL
)
chunk = self.transform_chunk(chunk, finishing)
if "Content-Length" in headers:
# The original content length is no longer correct.
# If this is the last (and only) chunk, we can set the new
# content-length; otherwise we remove it and fall back to
# chunked encoding.
if finishing:
headers["Content-Length"] = str(len(chunk))
else:
del headers["Content-Length"]
if not self._compressing:
return status_code, headers, chunk
ctype = _unicode(headers.get("Content-Type", "")).split(";")[0]
if not (
self._compressible_type(ctype)
and (not finishing or len(chunk) >= self.MIN_LENGTH)
and ("Content-Encoding" not in headers)
):
self._compressing = False
return status_code, headers, chunk

headers["Content-Encoding"] = self.CONTENT_ENCODING

self.prepare_transform()

chunk = self.transform_chunk(chunk, finishing)
if "Content-Length" in headers:
# The original content length is no longer correct.
# If this is the last (and only) chunk, we can set the new
# content-length; otherwise we remove it and fall back to
# chunked encoding.
if finishing:
headers["Content-Length"] = str(len(chunk))
else:
del headers["Content-Length"]

return status_code, headers, chunk

def prepare_transform(self) -> None:
raise NotImplementedError()

def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
if self._gzipping:
raise NotImplementedError()


class GZipContentEncoding(_CompressingOutputTransformABC):
"""Applies the gzip content encoding to the response.

See http://www.w3.org/Protocols/rfc2616/rfc2616-sec14.html#sec14.11

.. versionchanged:: 4.0
Now compresses all mime types beginning with ``text/``, instead
of just a whitelist. (the whitelist is still used for certain
non-text mime types).
"""

# Python's GzipFile defaults to level 9, while most other gzip
# tools (including gzip itself) default to 6, which is probably a
# better CPU/size tradeoff.
GZIP_LEVEL = 6

CONTENT_ENCODING = "gzip"

_gzip_value: BytesIO
_gzip_file: gzip.GzipFile

def prepare_transform(self) -> None:
self._gzip_value = BytesIO()
self._gzip_file = gzip.GzipFile(
mode="w", fileobj=self._gzip_value, compresslevel=self.GZIP_LEVEL
)

def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
if self._compressing:
self._gzip_file.write(chunk)
if finishing:
self._gzip_file.close()
Expand All @@ -3229,6 +3274,62 @@ def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
return chunk


class BrotliContentEncoding(_CompressingOutputTransformABC):
    """Applies the brotli (``br``) content encoding to the response.

    Requires the module-level name ``brotli`` to refer to an imported
    brotli binding; ``prepare_transform`` creates one streaming
    compressor per response.
    """

    CONTENT_ENCODING = "br"

    # Python's Brotli defaults to level 11
    BROTLI_LEVEL = 8

    def prepare_transform(self) -> None:
        """Create the streaming compressor used for this response."""
        self._compressor = brotli.Compressor(
            mode=brotli.MODE_TEXT, quality=self.BROTLI_LEVEL, lgwin=22, lgblock=0
        )

    def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
        """Compress ``chunk`` if compression is active for this response.

        :arg chunk: the next piece of the response body.
        :arg finishing: true when this is the last chunk of the response.
        :returns: the bytes to send; ``chunk`` unchanged when this
            transform is not compressing.
        """
        if self._compressing:
            chunk = self._compressor.process(chunk)
            if finishing:
                chunk += self._compressor.finish()
            else:
                # ``process`` may keep input in its internal buffer and
                # return nothing.  Flush so that every chunk the handler
                # writes (e.g. on an explicit flush of a streaming
                # response) actually reaches the client.
                chunk += self._compressor.flush()
        return chunk


# Optional dependency: use ``brotlicffi`` when it is installed, otherwise
# fall back to ``brotli``.  If neither can be imported, ``brotli`` is set
# to None.
try:
    import brotlicffi as brotli  # type: ignore[import]
except ImportError:
    try:
        import brotli  # type: ignore[import]
    except ImportError:
        brotli = None


#: The available compression algorithms sorted by preference.
#: The brotli entry comes first and is only present when a brotli binding
#: was imported; the gzip entry is always present.
COMPRESSION_ALGORITHMS: "List[Tuple[str, Type[_CompressingOutputTransformABC]]]" = []
if brotli:
    COMPRESSION_ALGORITHMS.append(("br", BrotliContentEncoding))
COMPRESSION_ALGORITHMS.append(("gzip", GZipContentEncoding))


def CompressingOutputTransform(request: httputil.HTTPServerRequest) -> OutputTransform:
    """Build the output transform that compresses the response to ``request``.

    Walks ``COMPRESSION_ALGORITHMS`` in order and instantiates the first
    entry whose name appears in the request's accepted encodings.  When
    no entry matches, a plain ``OutputTransform`` is returned instead.
    """
    accepted = _CompressingOutputTransformABC.accepted_encodings(request)
    match = next(
        (
            (encoding, transform_cls)
            for encoding, transform_cls in COMPRESSION_ALGORITHMS
            if encoding in accepted
        ),
        None,
    )
    if match is None:
        return OutputTransform(request)

    encoding, transform_cls = match
    # Same guards as before: a falsy class or an empty encoding name falls
    # back to the plain transform.
    if not transform_cls or not encoding:
        return OutputTransform(request)

    return transform_cls(request)


def authenticated(
method: Callable[..., Optional[Awaitable[None]]]
) -> Callable[..., Optional[Awaitable[None]]]:
Expand Down