tornadoweb · Joshix-1 · Feb 19, 2023 · Feb 19, 2023
diff --git a/setup.py b/setup.py
@@ -119,5 +119,11 @@ def get_tag(self):
         "Programming Language :: Python :: Implementation :: CPython",
         "Programming Language :: Python :: Implementation :: PyPy",
     ],
+    extras_require={
+        "brotli": [
+            "brotli; platform_python_implementation == 'CPython'",
+            "brotlicffi; platform_python_implementation != 'CPython'",
+        ]
+    },
     **kwargs
 )
diff --git a/tornado/web.py b/tornado/web.py
@@ -112,18 +112,20 @@ async def main():
 url = URLSpec
 
 from typing import (
-    Dict,
     Any,
-    Union,
-    Optional,
     Awaitable,
-    Tuple,
-    List,
     Callable,
-    Iterable,
+    Dict,
+    FrozenSet,
     Generator,
+    Iterable,
+    List,
+    MutableSequence,
+    Optional,
+    Tuple,
     Type,
     TypeVar,
+    Union,
     cast,
     overload,
 )
@@ -2101,13 +2103,19 @@ def __init__(
         self,
         handlers: Optional[_RuleList] = None,
         default_host: Optional[str] = None,
-        transforms: Optional[List[Type["OutputTransform"]]] = None,
+        transforms: Optional[
+            MutableSequence[Callable[[httputil.HTTPServerRequest], "OutputTransform"]]
+        ] = None,
         **settings: Any,
     ) -> None:
         if transforms is None:
-            self.transforms = []  # type: List[Type[OutputTransform]]
-            if settings.get("compress_response") or settings.get("gzip"):
-                self.transforms.append(GZipContentEncoding)
+            self.transforms = (
+                []
+            )  # type: MutableSequence[Callable[[httputil.HTTPServerRequest], OutputTransform]]
+            if settings.get("compress_response"):
+                self.transforms = [CompressingOutputTransform]
+            elif settings.get("gzip"):
+                self.transforms = [GZipContentEncoding]
         else:
             self.transforms = transforms
         self.default_host = default_host
@@ -3138,43 +3146,44 @@ def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
         return chunk
 
 
-class GZipContentEncoding(OutputTransform):
-    """Applies the gzip content encoding to the response.
-
-    See http://www.w3.org/Protocols/rfc2616/rfc2616-sec14.html#sec14.11
-
-    .. versionchanged:: 4.0
-        Now compresses all mime types beginning with ``text/``, instead
-        of just a whitelist. (the whitelist is still used for certain
-        non-text mime types).
-    """
+class _CompressingOutputTransformABC(OutputTransform):
+    """ABC for classes that compress outputs."""
 
     # Whitelist of compressible mime types (in addition to any types
     # beginning with "text/").
-    CONTENT_TYPES = set(
-        [
-            "application/javascript",
-            "application/x-javascript",
-            "application/xml",
-            "application/atom+xml",
-            "application/json",
-            "application/xhtml+xml",
-            "image/svg+xml",
-        ]
-    )
-    # Python's GzipFile defaults to level 9, while most other gzip
-    # tools (including gzip itself) default to 6, which is probably a
-    # better CPU/size tradeoff.
-    GZIP_LEVEL = 6
+    CONTENT_TYPES = {
+        "application/javascript",
+        "application/x-javascript",
+        "application/xml",
+        "application/atom+xml",
+        "application/json",
+        "application/xhtml+xml",
+        "image/svg+xml",
+    }
     # Responses that are too short are unlikely to benefit from gzipping
     # after considering the "Content-Encoding: gzip" header and the header
     # inside the gzip encoding.
     # Note that responses written in multiple chunks will be compressed
     # regardless of size.
     MIN_LENGTH = 1024
 
+    CONTENT_ENCODING: str = ""
+    """``Content-Encoding`` header value; each concrete sub-class overrides it."""
+
+    _compressing: bool
+    """If this is False the output will not be transformed."""
+
+    @staticmethod
+    def accepted_encodings(request: httputil.HTTPServerRequest) -> "FrozenSet[str]":
+        """Return lower-cased ``Accept-Encoding`` coding names, ignoring q-values."""
+        header = request.headers.get("Accept-Encoding", "").lower()
+        # Drop parameters (";q=0.8") and empty items so "gzip;q=0.8" still matches.
+        names = (item.split(";")[0].strip() for item in header.split(","))
+        return frozenset(name for name in names if name)
+
     def __init__(self, request: httputil.HTTPServerRequest) -> None:
-        self._gzipping = "gzip" in request.headers.get("Accept-Encoding", "")
+        super().__init__(request)
+        self._compressing = self.CONTENT_ENCODING in self.accepted_encodings(request)
 
     def _compressible_type(self, ctype: str) -> bool:
         return ctype.startswith("text/") or ctype in self.CONTENT_TYPES
@@ -3186,38 +3195,74 @@ def transform_first_chunk(
         chunk: bytes,
         finishing: bool,
     ) -> Tuple[int, httputil.HTTPHeaders, bytes]:
-        # TODO: can/should this type be inherited from the superclass?
         if "Vary" in headers:
             headers["Vary"] += ", Accept-Encoding"
         else:
             headers["Vary"] = "Accept-Encoding"
-        if self._gzipping:
-            ctype = _unicode(headers.get("Content-Type", "")).split(";")[0]
-            self._gzipping = (
-                self._compressible_type(ctype)
-                and (not finishing or len(chunk) >= self.MIN_LENGTH)
-                and ("Content-Encoding" not in headers)
-            )
-        if self._gzipping:
-            headers["Content-Encoding"] = "gzip"
-            self._gzip_value = BytesIO()
-            self._gzip_file = gzip.GzipFile(
-                mode="w", fileobj=self._gzip_value, compresslevel=self.GZIP_LEVEL
-            )
-            chunk = self.transform_chunk(chunk, finishing)
-            if "Content-Length" in headers:
-                # The original content length is no longer correct.
-                # If this is the last (and only) chunk, we can set the new
-                # content-length; otherwise we remove it and fall back to
-                # chunked encoding.
-                if finishing:
-                    headers["Content-Length"] = str(len(chunk))
-                else:
-                    del headers["Content-Length"]
+        if not self._compressing:
+            return status_code, headers, chunk
+        ctype = _unicode(headers.get("Content-Type", "")).split(";")[0]
+        if not (
+            self._compressible_type(ctype)
+            and (not finishing or len(chunk) >= self.MIN_LENGTH)
+            and ("Content-Encoding" not in headers)
+        ):
+            self._compressing = False
+            return status_code, headers, chunk
+
+        headers["Content-Encoding"] = self.CONTENT_ENCODING
+
+        self.prepare_transform()
+
+        chunk = self.transform_chunk(chunk, finishing)
+        if "Content-Length" in headers:
+            # The original content length is no longer correct.
+            # If this is the last (and only) chunk, we can set the new
+            # content-length; otherwise we remove it and fall back to
+            # chunked encoding.
+            if finishing:
+                headers["Content-Length"] = str(len(chunk))
+            else:
+                del headers["Content-Length"]
+
         return status_code, headers, chunk
 
+    def prepare_transform(self) -> None:
+        raise NotImplementedError()  # hook: sub-classes set up their compressor
+
     def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
-        if self._gzipping:
+        raise NotImplementedError()
+
+
+class GZipContentEncoding(_CompressingOutputTransformABC):
+    """Applies the gzip content encoding to the response.
+
+    See http://www.w3.org/Protocols/rfc2616/rfc2616-sec14.html#sec14.11
+
+    .. versionchanged:: 4.0
+        Now compresses all mime types beginning with ``text/``, instead
+        of just a whitelist. (the whitelist is still used for certain
+        non-text mime types).
+    """
+
+    # Python's GzipFile defaults to level 9, while most other gzip
+    # tools (including gzip itself) default to 6, which is probably a
+    # better CPU/size tradeoff.
+    GZIP_LEVEL = 6
+
+    CONTENT_ENCODING = "gzip"
+
+    _gzip_value: BytesIO
+    _gzip_file: gzip.GzipFile
+
+    def prepare_transform(self) -> None:
+        # In-memory sink that the GzipFile writes its compressed output into.
+        sink = self._gzip_value = BytesIO()
+        level = self.GZIP_LEVEL
+        self._gzip_file = gzip.GzipFile(mode="w", fileobj=sink, compresslevel=level)
+
+    def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
+        if self._compressing:
             self._gzip_file.write(chunk)
             if finishing:
                 self._gzip_file.close()
@@ -3229,6 +3274,62 @@ def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
         return chunk
 
 
+class BrotliContentEncoding(_CompressingOutputTransformABC):
+    """Applies the brotli (``br``) content encoding to the response."""
+
+    CONTENT_ENCODING = "br"
+
+    # Python's Brotli defaults to quality 11; a lower level trades size for speed.
+    BROTLI_LEVEL = 8
+
+    def prepare_transform(self) -> None:
+        self._compressor = brotli.Compressor(
+            mode=brotli.MODE_TEXT, quality=self.BROTLI_LEVEL, lgwin=22, lgblock=0
+        )
+
+    def transform_chunk(self, chunk: bytes, finishing: bool) -> bytes:
+        if not self._compressing:
+            return chunk
+        # Flush non-final chunks so streamed data is sent now, not at finish().
+        end = self._compressor.finish if finishing else self._compressor.flush
+        return self._compressor.process(chunk) + end()
+
+
+# Optional dependency: prefer brotlicffi, fall back to brotli; ``None`` when
+# neither module can be imported.
+try:
+    import brotlicffi as brotli  # type: ignore[import]
+except ImportError:
+    try:
+        import brotli  # type: ignore[import]
+    except ImportError:
+        brotli = None
+
+
+# "br" is only offered when a brotli module could be imported.
+COMPRESSION_ALGORITHMS: "List[Tuple[str, Type[_CompressingOutputTransformABC]]]" = (
+    [("br", BrotliContentEncoding)] if brotli else []
+) + [("gzip", GZipContentEncoding)]
+"""The available compression algorithms sorted by preference."""
+
+
+def CompressingOutputTransform(request: httputil.HTTPServerRequest) -> OutputTransform:
+    """Return the most preferred compressing transform the client accepts.
+
+    ``COMPRESSION_ALGORITHMS`` is searched in order.  When no entry is listed
+    in ``Accept-Encoding`` a disabled ``GZipContentEncoding`` is returned, so
+    the body is untouched but ``Vary: Accept-Encoding`` is still emitted.
+    """
+    accepted = _CompressingOutputTransformABC.accepted_encodings(request)
+    for name, class_ in COMPRESSION_ALGORITHMS:
+        if name in accepted:
+            return class_(request)
+    # A plain OutputTransform would drop the Vary header the gzip path adds.
+    fallback = GZipContentEncoding(request)
+    fallback._compressing = False
+    return fallback
+
+
 def authenticated(
     method: Callable[..., Optional[Awaitable[None]]]
 ) -> Callable[..., Optional[Awaitable[None]]]: