1 /*
2 *
3 * Copyright 2017 gRPC authors.
4 *
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at
8 *
9 * http://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 *
17 */
18
19 #include <grpc/support/port_platform.h>
20
21 #include "src/core/ext/transport/chttp2/transport/flow_control.h"
22
23 #include <inttypes.h>
24 #include <limits.h>
25 #include <math.h>
26 #include <string.h>
27
28 #include <grpc/support/alloc.h>
29 #include <grpc/support/log.h>
30 #include <grpc/support/string_util.h>
31
32 #include "src/core/ext/transport/chttp2/transport/internal.h"
33 #include "src/core/lib/gpr/string.h"
34
35 grpc_core::TraceFlag grpc_flowctl_trace(false, "flowctl");
36
37 namespace grpc_core {
38 namespace chttp2 {
39
40 namespace {
41
42 static constexpr const int kTracePadding = 30;
43 static constexpr const uint32_t kMaxWindowUpdateSize = (1u << 31) - 1;
44
fmt_int64_diff_str(int64_t old_val,int64_t new_val)45 static char* fmt_int64_diff_str(int64_t old_val, int64_t new_val) {
46 char* str;
47 if (old_val != new_val) {
48 gpr_asprintf(&str, "%" PRId64 " -> %" PRId64 "", old_val, new_val);
49 } else {
50 gpr_asprintf(&str, "%" PRId64 "", old_val);
51 }
52 char* str_lp = gpr_leftpad(str, ' ', kTracePadding);
53 gpr_free(str);
54 return str_lp;
55 }
56
fmt_uint32_diff_str(uint32_t old_val,uint32_t new_val)57 static char* fmt_uint32_diff_str(uint32_t old_val, uint32_t new_val) {
58 char* str;
59 if (old_val != new_val) {
60 gpr_asprintf(&str, "%" PRIu32 " -> %" PRIu32 "", old_val, new_val);
61 } else {
62 gpr_asprintf(&str, "%" PRIu32 "", old_val);
63 }
64 char* str_lp = gpr_leftpad(str, ' ', kTracePadding);
65 gpr_free(str);
66 return str_lp;
67 }
68 } // namespace
69
Init(const char * reason,TransportFlowControl * tfc,StreamFlowControl * sfc)70 void FlowControlTrace::Init(const char* reason, TransportFlowControl* tfc,
71 StreamFlowControl* sfc) {
72 tfc_ = tfc;
73 sfc_ = sfc;
74 reason_ = reason;
75 remote_window_ = tfc->remote_window();
76 target_window_ = tfc->target_window();
77 announced_window_ = tfc->announced_window();
78 if (sfc != nullptr) {
79 remote_window_delta_ = sfc->remote_window_delta();
80 local_window_delta_ = sfc->local_window_delta();
81 announced_window_delta_ = sfc->announced_window_delta();
82 }
83 }
84
Finish()85 void FlowControlTrace::Finish() {
86 uint32_t acked_local_window =
87 tfc_->transport()->settings[GRPC_SENT_SETTINGS]
88 [GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE];
89 uint32_t remote_window =
90 tfc_->transport()->settings[GRPC_PEER_SETTINGS]
91 [GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE];
92 char* trw_str = fmt_int64_diff_str(remote_window_, tfc_->remote_window());
93 char* tlw_str = fmt_int64_diff_str(target_window_, tfc_->target_window());
94 char* taw_str =
95 fmt_int64_diff_str(announced_window_, tfc_->announced_window());
96 char* srw_str;
97 char* slw_str;
98 char* saw_str;
99 if (sfc_ != nullptr) {
100 srw_str = fmt_int64_diff_str(remote_window_delta_ + remote_window,
101 sfc_->remote_window_delta() + remote_window);
102 slw_str =
103 fmt_int64_diff_str(local_window_delta_ + acked_local_window,
104 sfc_->local_window_delta() + acked_local_window);
105 saw_str =
106 fmt_int64_diff_str(announced_window_delta_ + acked_local_window,
107 sfc_->announced_window_delta() + acked_local_window);
108 } else {
109 srw_str = gpr_leftpad("", ' ', kTracePadding);
110 slw_str = gpr_leftpad("", ' ', kTracePadding);
111 saw_str = gpr_leftpad("", ' ', kTracePadding);
112 }
113 gpr_log(GPR_DEBUG,
114 "%p[%u][%s] | %s | trw:%s, ttw:%s, taw:%s, srw:%s, slw:%s, saw:%s",
115 tfc_, sfc_ != nullptr ? sfc_->stream()->id : 0,
116 tfc_->transport()->is_client ? "cli" : "svr", reason_, trw_str,
117 tlw_str, taw_str, srw_str, slw_str, saw_str);
118 gpr_free(trw_str);
119 gpr_free(tlw_str);
120 gpr_free(taw_str);
121 gpr_free(srw_str);
122 gpr_free(slw_str);
123 gpr_free(saw_str);
124 }
125
UrgencyString(Urgency u)126 const char* FlowControlAction::UrgencyString(Urgency u) {
127 switch (u) {
128 case Urgency::NO_ACTION_NEEDED:
129 return "no action";
130 case Urgency::UPDATE_IMMEDIATELY:
131 return "update immediately";
132 case Urgency::QUEUE_UPDATE:
133 return "queue update";
134 default:
135 GPR_UNREACHABLE_CODE(return "unknown");
136 }
137 GPR_UNREACHABLE_CODE(return "unknown");
138 }
139
Trace(grpc_chttp2_transport * t) const140 void FlowControlAction::Trace(grpc_chttp2_transport* t) const {
141 char* iw_str = fmt_uint32_diff_str(
142 t->settings[GRPC_SENT_SETTINGS][GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE],
143 initial_window_size_);
144 char* mf_str = fmt_uint32_diff_str(
145 t->settings[GRPC_SENT_SETTINGS][GRPC_CHTTP2_SETTINGS_MAX_FRAME_SIZE],
146 max_frame_size_);
147 gpr_log(GPR_DEBUG, "t[%s], s[%s], iw:%s:%s mf:%s:%s",
148 UrgencyString(send_transport_update_),
149 UrgencyString(send_stream_update_),
150 UrgencyString(send_initial_window_update_), iw_str,
151 UrgencyString(send_max_frame_size_update_), mf_str);
152 gpr_free(iw_str);
153 gpr_free(mf_str);
154 }
155
TransportFlowControlDisabled(grpc_chttp2_transport * t)156 TransportFlowControlDisabled::TransportFlowControlDisabled(
157 grpc_chttp2_transport* t) {
158 remote_window_ = kMaxWindow;
159 target_initial_window_size_ = kMaxWindow;
160 announced_window_ = kMaxWindow;
161 t->settings[GRPC_PEER_SETTINGS][GRPC_CHTTP2_SETTINGS_MAX_FRAME_SIZE] =
162 kFrameSize;
163 t->settings[GRPC_SENT_SETTINGS][GRPC_CHTTP2_SETTINGS_MAX_FRAME_SIZE] =
164 kFrameSize;
165 t->settings[GRPC_ACKED_SETTINGS][GRPC_CHTTP2_SETTINGS_MAX_FRAME_SIZE] =
166 kFrameSize;
167 t->settings[GRPC_PEER_SETTINGS][GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE] =
168 kMaxWindow;
169 t->settings[GRPC_SENT_SETTINGS][GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE] =
170 kMaxWindow;
171 t->settings[GRPC_ACKED_SETTINGS][GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE] =
172 kMaxWindow;
173 }
174
TransportFlowControl(const grpc_chttp2_transport * t,bool enable_bdp_probe)175 TransportFlowControl::TransportFlowControl(const grpc_chttp2_transport* t,
176 bool enable_bdp_probe)
177 : t_(t),
178 enable_bdp_probe_(enable_bdp_probe),
179 bdp_estimator_(t->peer_string),
180 pid_controller_(grpc_core::PidController::Args()
181 .set_gain_p(4)
182 .set_gain_i(8)
183 .set_gain_d(0)
184 .set_initial_control_value(TargetLogBdp())
185 .set_min_control_value(-1)
186 .set_max_control_value(25)
187 .set_integral_range(10)),
188 last_pid_update_(grpc_core::ExecCtx::Get()->Now()) {}
189
MaybeSendUpdate(bool writing_anyway)190 uint32_t TransportFlowControl::MaybeSendUpdate(bool writing_anyway) {
191 FlowControlTrace trace("t updt sent", this, nullptr);
192 const uint32_t target_announced_window =
193 static_cast<const uint32_t>(target_window());
194 if ((writing_anyway || announced_window_ <= target_announced_window / 2) &&
195 announced_window_ != target_announced_window) {
196 const uint32_t announce = static_cast<uint32_t> GPR_CLAMP(
197 target_announced_window - announced_window_, 0, kMaxWindowUpdateSize);
198 announced_window_ += announce;
199 return announce;
200 }
201 return 0;
202 }
203
ValidateRecvData(int64_t incoming_frame_size)204 grpc_error* TransportFlowControl::ValidateRecvData(
205 int64_t incoming_frame_size) {
206 if (incoming_frame_size > announced_window_) {
207 char* msg;
208 gpr_asprintf(&msg,
209 "frame of size %" PRId64 " overflows local window of %" PRId64,
210 incoming_frame_size, announced_window_);
211 grpc_error* err = GRPC_ERROR_CREATE_FROM_COPIED_STRING(msg);
212 gpr_free(msg);
213 return err;
214 }
215 return GRPC_ERROR_NONE;
216 }
217
StreamFlowControl(TransportFlowControl * tfc,const grpc_chttp2_stream * s)218 StreamFlowControl::StreamFlowControl(TransportFlowControl* tfc,
219 const grpc_chttp2_stream* s)
220 : tfc_(tfc), s_(s) {}
221
RecvData(int64_t incoming_frame_size)222 grpc_error* StreamFlowControl::RecvData(int64_t incoming_frame_size) {
223 FlowControlTrace trace(" data recv", tfc_, this);
224
225 grpc_error* error = GRPC_ERROR_NONE;
226 error = tfc_->ValidateRecvData(incoming_frame_size);
227 if (error != GRPC_ERROR_NONE) return error;
228
229 uint32_t sent_init_window =
230 tfc_->transport()->settings[GRPC_SENT_SETTINGS]
231 [GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE];
232 uint32_t acked_init_window =
233 tfc_->transport()->settings[GRPC_ACKED_SETTINGS]
234 [GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE];
235
236 int64_t acked_stream_window = announced_window_delta_ + acked_init_window;
237 int64_t sent_stream_window = announced_window_delta_ + sent_init_window;
238 if (incoming_frame_size > acked_stream_window) {
239 if (incoming_frame_size <= sent_stream_window) {
240 gpr_log(GPR_ERROR,
241 "Incoming frame of size %" PRId64
242 " exceeds local window size of %" PRId64
243 ".\n"
244 "The (un-acked, future) window size would be %" PRId64
245 " which is not exceeded.\n"
246 "This would usually cause a disconnection, but allowing it due to"
247 "broken HTTP2 implementations in the wild.\n"
248 "See (for example) https://github.com/netty/netty/issues/6520.",
249 incoming_frame_size, acked_stream_window, sent_stream_window);
250 } else {
251 char* msg;
252 gpr_asprintf(
253 &msg, "frame of size %" PRId64 " overflows local window of %" PRId64,
254 incoming_frame_size, acked_stream_window);
255 grpc_error* err = GRPC_ERROR_CREATE_FROM_COPIED_STRING(msg);
256 gpr_free(msg);
257 return err;
258 }
259 }
260
261 UpdateAnnouncedWindowDelta(tfc_, -incoming_frame_size);
262 local_window_delta_ -= incoming_frame_size;
263 tfc_->CommitRecvData(incoming_frame_size);
264 return GRPC_ERROR_NONE;
265 }
266
MaybeSendUpdate()267 uint32_t StreamFlowControl::MaybeSendUpdate() {
268 FlowControlTrace trace("s updt sent", tfc_, this);
269 if (local_window_delta_ > announced_window_delta_) {
270 uint32_t announce = static_cast<uint32_t> GPR_CLAMP(
271 local_window_delta_ - announced_window_delta_, 0, kMaxWindowUpdateSize);
272 UpdateAnnouncedWindowDelta(tfc_, announce);
273 return announce;
274 }
275 return 0;
276 }
277
IncomingByteStreamUpdate(size_t max_size_hint,size_t have_already)278 void StreamFlowControl::IncomingByteStreamUpdate(size_t max_size_hint,
279 size_t have_already) {
280 FlowControlTrace trace("app st recv", tfc_, this);
281 uint32_t max_recv_bytes;
282 uint32_t sent_init_window =
283 tfc_->transport()->settings[GRPC_SENT_SETTINGS]
284 [GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE];
285
286 /* clamp max recv hint to an allowable size */
287 if (max_size_hint >= UINT32_MAX - sent_init_window) {
288 max_recv_bytes = UINT32_MAX - sent_init_window;
289 } else {
290 max_recv_bytes = static_cast<uint32_t>(max_size_hint);
291 }
292
293 /* account for bytes already received but unknown to higher layers */
294 if (max_recv_bytes >= have_already) {
295 max_recv_bytes -= static_cast<uint32_t>(have_already);
296 } else {
297 max_recv_bytes = 0;
298 }
299
300 /* add some small lookahead to keep pipelines flowing */
301 GPR_ASSERT(max_recv_bytes <= UINT32_MAX - sent_init_window);
302 if (local_window_delta_ < max_recv_bytes) {
303 uint32_t add_max_recv_bytes =
304 static_cast<uint32_t>(max_recv_bytes - local_window_delta_);
305 local_window_delta_ += add_max_recv_bytes;
306 }
307 }
308
309 // Take in a target and modifies it based on the memory pressure of the system
AdjustForMemoryPressure(grpc_resource_quota * quota,double target)310 static double AdjustForMemoryPressure(grpc_resource_quota* quota,
311 double target) {
312 // do not increase window under heavy memory pressure.
313 double memory_pressure = grpc_resource_quota_get_memory_pressure(quota);
314 static const double kLowMemPressure = 0.1;
315 static const double kZeroTarget = 22;
316 static const double kHighMemPressure = 0.8;
317 static const double kMaxMemPressure = 0.9;
318 if (memory_pressure < kLowMemPressure && target < kZeroTarget) {
319 target = (target - kZeroTarget) * memory_pressure / kLowMemPressure +
320 kZeroTarget;
321 } else if (memory_pressure > kHighMemPressure) {
322 target *= 1 - GPR_MIN(1, (memory_pressure - kHighMemPressure) /
323 (kMaxMemPressure - kHighMemPressure));
324 }
325 return target;
326 }
327
TargetLogBdp()328 double TransportFlowControl::TargetLogBdp() {
329 return AdjustForMemoryPressure(
330 grpc_resource_user_quota(grpc_endpoint_get_resource_user(t_->ep)),
331 1 + log2(bdp_estimator_.EstimateBdp()));
332 }
333
SmoothLogBdp(double value)334 double TransportFlowControl::SmoothLogBdp(double value) {
335 grpc_millis now = grpc_core::ExecCtx::Get()->Now();
336 double bdp_error = value - pid_controller_.last_control_value();
337 const double dt = static_cast<double>(now - last_pid_update_) * 1e-3;
338 last_pid_update_ = now;
339 // Limit dt to 100ms
340 const double kMaxDt = 0.1;
341 return pid_controller_.Update(bdp_error, dt > kMaxDt ? kMaxDt : dt);
342 }
343
DeltaUrgency(int64_t value,grpc_chttp2_setting_id setting_id)344 FlowControlAction::Urgency TransportFlowControl::DeltaUrgency(
345 int64_t value, grpc_chttp2_setting_id setting_id) {
346 int64_t delta = value - static_cast<int64_t>(
347 t_->settings[GRPC_LOCAL_SETTINGS][setting_id]);
348 // TODO(ncteisen): tune this
349 if (delta != 0 && (delta <= -value / 5 || delta >= value / 5)) {
350 return FlowControlAction::Urgency::QUEUE_UPDATE;
351 } else {
352 return FlowControlAction::Urgency::NO_ACTION_NEEDED;
353 }
354 }
355
PeriodicUpdate()356 FlowControlAction TransportFlowControl::PeriodicUpdate() {
357 FlowControlAction action;
358 if (enable_bdp_probe_) {
359 // get bdp estimate and update initial_window accordingly.
360 // target might change based on how much memory pressure we are under
361 // TODO(ncteisen): experiment with setting target to be huge under low
362 // memory pressure.
363 const double target = pow(2, SmoothLogBdp(TargetLogBdp()));
364
365 // Though initial window 'could' drop to 0, we keep the floor at 128
366 target_initial_window_size_ =
367 static_cast<int32_t> GPR_CLAMP(target, 128, INT32_MAX);
368
369 action.set_send_initial_window_update(
370 DeltaUrgency(target_initial_window_size_,
371 GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE),
372 static_cast<uint32_t>(target_initial_window_size_));
373
374 // get bandwidth estimate and update max_frame accordingly.
375 double bw_dbl = bdp_estimator_.EstimateBandwidth();
376 // we target the max of BDP or bandwidth in microseconds.
377 int32_t frame_size = static_cast<int32_t> GPR_CLAMP(
378 GPR_MAX((int32_t)GPR_CLAMP(bw_dbl, 0, INT_MAX) / 1000,
379 target_initial_window_size_),
380 16384, 16777215);
381 action.set_send_max_frame_size_update(
382 DeltaUrgency(static_cast<int64_t>(frame_size),
383 GRPC_CHTTP2_SETTINGS_MAX_FRAME_SIZE),
384 frame_size);
385 }
386 return UpdateAction(action);
387 }
388
UpdateAction(FlowControlAction action)389 FlowControlAction StreamFlowControl::UpdateAction(FlowControlAction action) {
390 // TODO(ncteisen): tune this
391 if (!s_->read_closed) {
392 uint32_t sent_init_window =
393 tfc_->transport()->settings[GRPC_SENT_SETTINGS]
394 [GRPC_CHTTP2_SETTINGS_INITIAL_WINDOW_SIZE];
395 if (local_window_delta_ > announced_window_delta_ &&
396 announced_window_delta_ + sent_init_window <= sent_init_window / 2) {
397 action.set_send_stream_update(
398 FlowControlAction::Urgency::UPDATE_IMMEDIATELY);
399 } else if (local_window_delta_ > announced_window_delta_) {
400 action.set_send_stream_update(FlowControlAction::Urgency::QUEUE_UPDATE);
401 }
402 }
403
404 return action;
405 }
406
407 } // namespace chttp2
408 } // namespace grpc_core
409