Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[THREESCALE-9542] Part 2: Add support to proxy request with Transfer-Encoding: chunked #1403

Merged
merged 8 commits into from
Jan 22, 2024
2 changes: 2 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,8 @@ and this project adheres to [Semantic Versioning](http://semver.org/).

- Fixed CVE-2023-44487 (HTTP/2 Rapid Reset) [PR #1417](/~https://github.com/3scale/apicast/pull/1417) [THREESCALE-10224](https://issues.redhat.com/browse/THREESCALE-10224)

- Fixed issue where the proxy policy could not handle requests with "Transfer-Encoding: chunked" header [PR #1403](/~https://github.com/3scale/APIcast/pull/1403) [THREESCALE-9542](https://issues.redhat.com/browse/THREESCALE-9542)

### Added

- Detect number of CPU shares when running on Cgroups V2 [PR #1410](/~https://github.com/3scale/apicast/pull/1410) [THREESCALE-10167](https://issues.redhat.com/browse/THREESCALE-10167)
Expand Down
148 changes: 121 additions & 27 deletions gateway/src/apicast/http_proxy.lua
Original file line number Diff line number Diff line change
@@ -1,14 +1,30 @@
local format = string.format
local tostring = tostring
local ngx_flush = ngx.flush
local ngx_get_method = ngx.req.get_method
local ngx_http_version = ngx.req.http_version
local ngx_send_headers = ngx.send_headers

local resty_url = require "resty.url"
local resty_resolver = require 'resty.resolver'
local round_robin = require 'resty.balancer.round_robin'
local http_proxy = require 'resty.http.proxy'
local file_reader = require("resty.file").file_reader
local file_size = require("resty.file").file_size
local client_body_reader = require("resty.http.request_reader").get_client_body_reader
local send_response = require("resty.http.response_writer").send_response
local concat = table.concat

local _M = { }

local http_methods_with_body = {
POST = true,
PUT = true,
PATCH = true

Check warning on line 23 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L23

Added line #L23 was not covered by tests
}

local DEFAULT_CHUNKSIZE = 32 * 1024

function _M.reset()
_M.balancer = round_robin.new()
_M.resolver = resty_resolver
Expand Down Expand Up @@ -82,15 +98,50 @@
)
end

local function forward_https_request(proxy_uri, proxy_auth, uri, skip_https_connect)
-- This is needed to call ngx.req.get_body_data() below.
ngx.req.read_body()
local function forward_https_request(proxy_uri, uri, proxy_opts)
local body, err
local sock
local opts = proxy_opts or {}
local req_method = ngx_get_method()
local encoding = ngx.req.get_headers()["Transfer-Encoding"]
local is_chunked = encoding and encoding:lower() == "chunked"
local content_type = ngx.req.get_headers()["Content-Type"]
local content_type_is_urlencoded = content_type and content_type:lower() == "application/x-www-form-urlencoded"
local raw = false

Check warning on line 110 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L104-L110

Added lines #L104 - L110 were not covered by tests

if http_methods_with_body[req_method] then

Check warning on line 112 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L112

Added line #L112 was not covered by tests

-- When the content type is "application/x-www-form-urlencoded" the body is always pre-read.
-- See: gateway/src/apicast/configuration/service.lua:214
--
-- Due to this, ngx.req.socket() will fail with "request body already exists" error or return
-- socket but hang on read in case of raw socket. Therefore, we only retrieve body from the
-- socket if the content type is not "application/x-www-form-urlencoded"
if opts.request_unbuffered and ngx_http_version() == 1.1 and not content_type_is_urlencoded then
if is_chunked then

Check warning on line 121 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L120-L121

Added lines #L120 - L121 were not covered by tests
-- The default ngx reader does not support chunked request
-- so we will need to get the raw request socket and manually
-- decode the chunked request
sock, err = ngx.req.socket(true)
raw = true

Check warning on line 126 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L125-L126

Added lines #L125 - L126 were not covered by tests
else
sock, err = ngx.req.socket()

Check warning on line 128 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L128

Added line #L128 was not covered by tests
end

local request = {
uri = uri,
method = ngx.req.get_method(),
headers = ngx.req.get_headers(0, true),
path = format('%s%s%s', ngx.var.uri, ngx.var.is_args, ngx.var.query_string or ''),
if not sock then
ngx.log(ngx.ERR, "unable to obtain request socket: ", err)
return ngx.exit(ngx.HTTP_INTERNAL_SERVER_ERROR)

Check warning on line 133 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L131-L133

Added lines #L131 - L133 were not covered by tests
end

body = client_body_reader(sock, DEFAULT_CHUNKSIZE, is_chunked)

Check warning on line 136 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L136

Added line #L136 was not covered by tests
else
-- TODO: Due to ngx.req.read_body(). The current implementation will not work with grpc service
-- See: /~https://github.com/3scale/APIcast/pull/1419
-- Should we get the body from socket by default and only read buffered body if
-- "Content-Type: application/x-www-form-urlencoded"?
--
-- This is needed to call ngx.req.get_body_data() below.
ngx.req.read_body()

Check warning on line 144 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L144

Added line #L144 was not covered by tests

-- We cannot use resty.http's .get_client_body_reader().
-- In POST requests with HTTPS, the result of that call is nil, and it
Expand All @@ -101,26 +152,55 @@
-- read and need to be cached in a local file. This request will return
-- nil, so after this we need to read the temp file.
-- /~https://github.com/openresty/lua-nginx-module#ngxreqget_body_data
body = ngx.req.get_body_data(),
proxy_uri = proxy_uri,
proxy_auth = proxy_auth
}
body = ngx.req.get_body_data()

Check warning on line 155 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L155

Added line #L155 was not covered by tests

if not body then
local temp_file_path = ngx.req.get_body_file()
ngx.log(ngx.INFO, "HTTPS Proxy: Request body is bigger than client_body_buffer_size, read the content from path='", temp_file_path, "'")

Check warning on line 159 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L157-L159

Added lines #L157 - L159 were not covered by tests

if temp_file_path then
body, err = file_reader(temp_file_path)
if err then
ngx.log(ngx.ERR, "HTTPS proxy: Failed to read temp body file, err: ", err)
ngx.exit(ngx.HTTP_INTERNAL_SERVER_ERROR)

Check warning on line 165 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L161-L165

Added lines #L161 - L165 were not covered by tests
end

if is_chunked then

Check warning on line 168 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L168

Added line #L168 was not covered by tests
-- If the body is smaller than "client_boby_buffer_size" the Content-Length header is
-- set by openresty based on the size of the buffer. However, when the body is rendered
-- to a file, we will need to calculate and manually set the Content-Length header based
-- on the file size
local contentLength, err = file_size(temp_file_path)()
if err then
ngx.log(ngx.ERR, "HTTPS proxy: Failed to set content length, err: ", err)
ngx.exit(ngx.HTTP_INTERNAL_SERVER_ERROR)

Check warning on line 176 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L173-L176

Added lines #L173 - L176 were not covered by tests
end

ngx.req.set_header("Content-Length", tostring(contentLength))

Check warning on line 179 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L179

Added line #L179 was not covered by tests
end
end
end

if not request.body then
local temp_file_path = ngx.req.get_body_file()
ngx.log(ngx.INFO, "HTTPS Proxy: Request body is bigger than client_body_buffer_size, read the content from path='", temp_file_path, "'")

if temp_file_path then
local body, err = file_reader(temp_file_path)
if err then
ngx.log(ngx.ERR, "HTTPS proxy: Failed to read temp body file, err: ", err)
ngx.exit(ngx.HTTP_INTERNAL_SERVER_ERROR)
end
request.body = body
-- The whole request is buffered with chunked encoding removed, so remove the Transfer-Encoding: chunked
-- header, otherwise the upstream won't be able to read the body as it expected chunk encoded
-- body
if is_chunked then
ngx.req.set_header("Transfer-Encoding", nil)

Check warning on line 188 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L187-L188

Added lines #L187 - L188 were not covered by tests
end
end
end

local httpc, err = http_proxy.new(request, skip_https_connect)
local request = {

Check warning on line 193 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L193

Added line #L193 was not covered by tests
uri = uri,
method = ngx.req.get_method(),
headers = ngx.req.get_headers(0, true),
path = format('%s%s%s', ngx.var.uri, ngx.var.is_args, ngx.var.query_string or ''),
body = body,
proxy_uri = proxy_uri,
proxy_auth = opts.proxy_auth

Check warning on line 200 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L200

Added line #L200 was not covered by tests
}

local httpc, err = http_proxy.new(request, opts.skip_https_connect)

Check warning on line 203 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L203

Added line #L203 was not covered by tests

if not httpc then
ngx.log(ngx.ERR, 'could not connect to proxy: ', proxy_uri, ' err: ', err)
Expand All @@ -132,8 +212,16 @@
res, err = httpc:request(request)

if res then
httpc:proxy_response(res)
httpc:set_keepalive()
if opts.request_unbuffered and raw then
local bytes, err = send_response(sock, res, DEFAULT_CHUNKSIZE)
if not bytes then
ngx.log(ngx.ERR, "failed to send response: ", err)
return sock:send("HTTP/1.1 502 Bad Gateway")

Check warning on line 219 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L215-L219

Added lines #L215 - L219 were not covered by tests
end
else
httpc:proxy_response(res)
httpc:set_keepalive()

Check warning on line 223 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L222-L223

Added lines #L222 - L223 were not covered by tests
end
else
ngx.log(ngx.ERR, 'failed to proxy request to: ', proxy_uri, ' err : ', err)
return ngx.exit(ngx.HTTP_BAD_GATEWAY)
Expand Down Expand Up @@ -186,7 +274,13 @@
return
elseif uri.scheme == 'https' then
upstream:rewrite_request()
forward_https_request(proxy_uri, proxy_auth, uri, upstream.skip_https_connect)
local proxy_opts = {

Check warning on line 277 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L277

Added line #L277 was not covered by tests
proxy_auth = proxy_auth,
skip_https_connect = upstream.skip_https_connect,
request_unbuffered = upstream.request_unbuffered

Check warning on line 280 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L280

Added line #L280 was not covered by tests
}

forward_https_request(proxy_uri, uri, proxy_opts)

Check warning on line 283 in gateway/src/apicast/http_proxy.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/apicast/http_proxy.lua#L283

Added line #L283 was not covered by tests
return ngx.exit(ngx.OK) -- terminate phase
else
ngx.log(ngx.ERR, 'could not connect to proxy: ', proxy_uri, ' err: ', 'invalid request scheme')
Expand Down
97 changes: 91 additions & 6 deletions gateway/src/apicast/policy/request_unbuffered/README.md
Original file line number Diff line number Diff line change
@@ -1,14 +1,99 @@
# APICast Request Unbuffered

This policy allows to disable request buffering
## Description

When enable this policy will dymanically sets the [`proxy_request_buffering: off`](https://nginx.org/en/docs/http/ngx_http_proxy_module.html#proxy_request_buffering
) directive per service.


## Technical details

By default, NGINX reads the entire request body into memory (or buffers large requests into disk) before proxying it to the upstream server. However, reading bodies can become expensive, especially when requests with large payloads are sent.
Copy link
Contributor

@dfennessy dfennessy Jan 19, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
By default, NGINX reads the entire request body into memory (or buffers large requests into disk) before proxying it to the upstream server. However, reading bodies can become expensive, especially when requests with large payloads are sent.
By default, NGINX reads the entire request body into memory or buffers large requests to disk before forwarding them to the upstream server. Reading bodies can become expensive, especially when sending requests containing large payloads.


For example, when the client sends 10GB, NGINX will buffer the entire 10GB to disk before sending anything to
the upstream server.

When `proxy_request_buffering` is in the chain, request buffering will be disabled and the request body will be sent to the proxied server immediately as it received. This can help minimize time spent sending data to a service and disk I/O for requests with big body. However, there are caveats and corner cases applied, [**Caveats**](#caveats)
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

proxy_request_buffering is not the name of the policy, is it?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

oops

Copy link
Contributor

@dfennessy dfennessy Jan 19, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
When `proxy_request_buffering` is in the chain, request buffering will be disabled and the request body will be sent to the proxied server immediately as it received. This can help minimize time spent sending data to a service and disk I/O for requests with big body. However, there are caveats and corner cases applied, [**Caveats**](#caveats)
When the `proxy_request_buffering` is in the chain, request buffering is disabled, sending the request body to the proxied server immediately upon receiving it. This can help minimize time spent sending data to a service and disk I/O for requests with big body. However, there are caveats and corner cases applied, [**Caveats**](#caveats)


The policy also provides a consistent behavior across multiple scenarios like:

```
- APIcast <> upstream HTTP 1.1 plain
- APIcast <> upstream TLS
- APIcast <> HTTP Proxy (env var) <> upstream HTTP 1.1 plain
- APIcast <> HTTP Proxy (policy) <> upstream HTTP 1.1 plain
- APIcast <> HTTP Proxy (camel proxy) <> upstream HTTP 1.1 plain
- APIcast <> HTTP Proxy (env var) <> upstream TLS
- APIcast <> HTTP Proxy (policy) <> upstream TLS
- APIcast <> HTTP Proxy (camel proxy) <> upstream TLS
```

## Why don't we also support disable response buffering?

The response buffering is enabled by default in NGINX (the [`proxy_buffering: on`]() directive). It does
this to shield the backend against slow clients ([slowloris attack](https://en.wikipedia.org/wiki/Slowloris_(computer_security))).

If the `proxy_buffering` is disabled, the upstream server will be forced to keep the connection open until all data has been received by the client. Thereforce, NGINX [advises](https://www.nginx.com/blog/avoiding-top-10-nginx-configuration-mistakes/#proxy_buffering-off) against disabling `proxy_buffering` as it will potentially waste upstream server resources.
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
If the `proxy_buffering` is disabled, the upstream server will be forced to keep the connection open until all data has been received by the client. Thereforce, NGINX [advises](https://www.nginx.com/blog/avoiding-top-10-nginx-configuration-mistakes/#proxy_buffering-off) against disabling `proxy_buffering` as it will potentially waste upstream server resources.
If the `proxy_buffering` is disabled, the upstream server keeps the connection open until all data is received by the client. NGINX [advises](https://www.nginx.com/blog/avoiding-top-10-nginx-configuration-mistakes/#proxy_buffering-off) against disabling `proxy_buffering` as it will potentially waste upstream server resources.


## Example configuration

```
{
"name": "request_unbuffered",
"version": "builtin",
"configuration": {}
}
"policy_chain": [
{
"name": "request_unbuffered",
"version": "builtin",
},
{
"name": "apicast.policy.apicast"
}
]
```

Use with Proxy policy

```
"policy_chain": [
{
"name": "request_unbuffered",
"version": "builtin",
},
{
"name": "apicast.policy.http_proxy",
"configuration": {
"all_proxy": "http://foo:bar@192.168.15.103:8888/",
"https_proxy": "http://192.168.15.103:8888/",
"http_proxy": "http://192.168.15.103:8888/"
}
}
]
```

Use with Camel Proxy policy

```
"policy_chain": [
{
"name": "request_unbuffered",
"version": "builtin",
},
{
"name": "apicast.policy.camel",
"configuration": {
"http_proxy": "http://192.168.15.103:8080/",
"https_proxy": "http://192.168.15.103:8443/",
"all_proxy": "http://192.168.15.103:8080/"
}
}
]
```

## Caveats

- Because APIcast allows defining mapping rules based on request content, ie `POST /some_path?a_param={a_value}`
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
- Because APIcast allows defining mapping rules based on request content, ie `POST /some_path?a_param={a_value}`
- APIcast allows defining of mapping rules based on request content. For example, `POST /some_path?a_param={a_value}`

will match a request like `POST "http://apicast_host:8080/some_path"` with a form URL-encoded body like: `a_param=abc`
, requests with `Content-type: application/x-www-form-urlencoded` will always be buffered regardless of the
`request_unbuffered` policy is enabled or not.
- For a request with "small" body that fits into [`client_body_buffer_size`](https://nginx.org/en/docs/http/ngx_http_core_module.html#client_body_buffer_size) and with header "Transfer-Encoding: chunked", NGINX will always read and know the length of the body.
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is nice to note, but it is not a caveat (a limitation), it is expected and correct. All about unbuffered request is the fact, as you correctly pointed out, that the request body will be sent to the proxied server immediately as it received. The transfer encoding is HOP-BY-HOP encoding and nothing prevents from changing it from one hop to the next one.

Then it will send the request to upstream with the "Content-Length" header.
- If a client uses chunked transfer encoding with HTTP/1.0, NGINX will always buffer the request body
- Disable request buffering could potentially expose the backend to [slowloris attack](https://en.wikipedia.org/wiki/Slowloris_(computer_security)). Therefore, we recommend to only use this policy when needed.
1 change: 1 addition & 0 deletions gateway/src/apicast/upstream.lua
Original file line number Diff line number Diff line change
Expand Up @@ -241,6 +241,7 @@ function _M:call(context)
self:set_skip_https_connect_on_proxy();
end

self.request_unbuffered = context.request_unbuffered
http_proxy.request(self, proxy_uri)
else
local err = self:rewrite_request()
Expand Down
19 changes: 19 additions & 0 deletions gateway/src/resty/file.lua
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
local co_yield = coroutine._yield
local co_wrap = coroutine._wrap
local open = io.open

local co_wrap_iter = require("resty.coroutines").co_wrap_iter
Expand Down Expand Up @@ -28,4 +29,22 @@
end)
end

function _M.file_size(filename)
return co_wrap(function()
local handle, err = open(filename)

Check warning on line 34 in gateway/src/resty/file.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/resty/file.lua#L33-L34

Added lines #L33 - L34 were not covered by tests

if err then
return nil, err

Check warning on line 37 in gateway/src/resty/file.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/resty/file.lua#L36-L37

Added lines #L36 - L37 were not covered by tests
end

local current = handle:seek()
local size = handle:seek("end")

Check warning on line 41 in gateway/src/resty/file.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/resty/file.lua#L40-L41

Added lines #L40 - L41 were not covered by tests

handle:seek("set", current)
handle:close()

Check warning on line 44 in gateway/src/resty/file.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/resty/file.lua#L43-L44

Added lines #L43 - L44 were not covered by tests

return size

Check warning on line 46 in gateway/src/resty/file.lua

View check run for this annotation

Codecov / codecov/patch

gateway/src/resty/file.lua#L46

Added line #L46 was not covered by tests
end)
end

return _M
Loading
Loading