xref: /openssl/ssl/quic/quic_txp.c (revision c3542b22)
1 /*
2  * Copyright 2022-2024 The OpenSSL Project Authors. All Rights Reserved.
3  *
4  * Licensed under the Apache License 2.0 (the "License").  You may not use
5  * this file except in compliance with the License.  You can obtain a copy
6  * in the file LICENSE in the source distribution or at
7  * https://www.openssl.org/source/license.html
8  */
9 
10 #include "internal/quic_txp.h"
11 #include "internal/quic_fifd.h"
12 #include "internal/quic_stream_map.h"
13 #include "internal/quic_error.h"
14 #include "internal/common.h"
15 #include <openssl/err.h>
16 
17 #define MIN_CRYPTO_HDR_SIZE             3
18 
19 #define MIN_FRAME_SIZE_HANDSHAKE_DONE   1
20 #define MIN_FRAME_SIZE_MAX_DATA         2
21 #define MIN_FRAME_SIZE_ACK              5
22 #define MIN_FRAME_SIZE_CRYPTO           (MIN_CRYPTO_HDR_SIZE + 1)
23 #define MIN_FRAME_SIZE_STREAM           3 /* minimum useful size (for non-FIN) */
24 #define MIN_FRAME_SIZE_MAX_STREAMS_BIDI 2
25 #define MIN_FRAME_SIZE_MAX_STREAMS_UNI  2
26 
27 /*
28  * Packet Archetypes
29  * =================
30  */
31 
32 /* Generate normal packets containing most frame types, subject to EL. */
33 #define TX_PACKETISER_ARCHETYPE_NORMAL              0
34 
35 /*
36  * A probe packet is different in that:
37  *   - It bypasses CC, but *is* counted as in flight for purposes of CC;
38  *   - It must be ACK-eliciting.
39  */
40 #define TX_PACKETISER_ARCHETYPE_PROBE               1
41 
42 /*
43  * An ACK-only packet is different in that:
44  *   - It bypasses CC, and is considered a 'non-inflight' packet;
45  *   - It may not contain anything other than an ACK frame, not even padding.
46  */
47 #define TX_PACKETISER_ARCHETYPE_ACK_ONLY            2
48 
49 #define TX_PACKETISER_ARCHETYPE_NUM                 3
50 
51 struct ossl_quic_tx_packetiser_st {
52     OSSL_QUIC_TX_PACKETISER_ARGS args;
53 
54     /*
55      * Opaque initial token blob provided by caller. TXP frees using the
56      * callback when it is no longer needed.
57      */
58     const unsigned char             *initial_token;
59     size_t                          initial_token_len;
60     ossl_quic_initial_token_free_fn *initial_token_free_cb;
61     void                            *initial_token_free_cb_arg;
62 
63     /* Subcomponents of the TXP that we own. */
64     QUIC_FIFD       fifd;       /* QUIC Frame-in-Flight Dispatcher */
65 
66     /* Internal state. */
67     uint64_t        next_pn[QUIC_PN_SPACE_NUM]; /* Next PN to use in given PN space. */
68     OSSL_TIME       last_tx_time;               /* Last time a packet was generated, or 0. */
69 
70     /* Internal state - frame (re)generation flags. */
71     unsigned int    want_handshake_done     : 1;
72     unsigned int    want_max_data           : 1;
73     unsigned int    want_max_streams_bidi   : 1;
74     unsigned int    want_max_streams_uni    : 1;
75 
76     /* Internal state - frame (re)generation flags - per PN space. */
77     unsigned int    want_ack                : QUIC_PN_SPACE_NUM;
78     unsigned int    force_ack_eliciting     : QUIC_PN_SPACE_NUM;
79 
80     /*
81      * Internal state - connection close terminal state.
82      * Once this is set, it is not unset unlike other want_ flags - we keep
83      * sending it in every packet.
84      */
85     unsigned int    want_conn_close         : 1;
86 
87     /* Has the handshake been completed? */
88     unsigned int    handshake_complete      : 1;
89 
90     OSSL_QUIC_FRAME_CONN_CLOSE  conn_close_frame;
91 
92     /*
93      * Counts of the number of bytes received and sent while in the closing
94      * state.
95      */
96     uint64_t                        closing_bytes_recv;
97     uint64_t                        closing_bytes_xmit;
98 
99     /* Internal state - packet assembly. */
100     struct txp_el {
101         unsigned char   *scratch;       /* scratch buffer for packet assembly */
102         size_t          scratch_len;    /* number of bytes allocated for scratch */
103         OSSL_QTX_IOVEC  *iovec;         /* scratch iovec array for use with QTX */
104         size_t          alloc_iovec;    /* size of iovec array */
105     } el[QUIC_ENC_LEVEL_NUM];
106 
107     /* Message callback related arguments */
108     ossl_msg_cb msg_callback;
109     void *msg_callback_arg;
110     SSL *msg_callback_ssl;
111 
112     /* Callbacks. */
113     void            (*ack_tx_cb)(const OSSL_QUIC_FRAME_ACK *ack,
114                                  uint32_t pn_space,
115                                  void *arg);
116     void            *ack_tx_cb_arg;
117 };
118 
119 /*
120  * The TX helper records state used while generating frames into packets. It
121  * enables serialization into the packet to be done "transactionally" where
122  * serialization of a frame can be rolled back if it fails midway (e.g. if it
123  * does not fit).
124  */
125 struct tx_helper {
126     OSSL_QUIC_TX_PACKETISER *txp;
127     /*
128      * The Maximum Packet Payload Length in bytes. This is the amount of
129      * space we have to generate frames into.
130      */
131     size_t max_ppl;
132     /*
133      * Number of bytes we have generated so far.
134      */
135     size_t bytes_appended;
136     /*
137      * Number of scratch bytes in txp->scratch we have used so far. Some iovecs
138      * will reference this scratch buffer. When we need to use more of it (e.g.
139      * when we need to put frame headers somewhere), we append to the scratch
140      * buffer, resizing if necessary, and increase this accordingly.
141      */
142     size_t scratch_bytes;
143     /*
144      * Bytes reserved in the MaxPPL budget. We keep this number of bytes spare
145      * until reserve_allowed is set to 1. Currently this is always at most 1, as
146      * a PING frame takes up one byte and this mechanism is only used to ensure
147      * we can encode a PING frame if we have been asked to ensure a packet is
148      * ACK-eliciting and we are unusure if we are going to add any other
149      * ACK-eliciting frames before we reach our MaxPPL budget.
150      */
151     size_t reserve;
152     /*
153      * Number of iovecs we have currently appended. This is the number of
154      * entries valid in txp->iovec.
155      */
156     size_t num_iovec;
157     /* The EL this TX helper is being used for. */
158     uint32_t enc_level;
159     /*
160      * Whether we are allowed to make use of the reserve bytes in our MaxPPL
161      * budget. This is used to ensure we have room to append a PING frame later
162      * if we need to. Once we know we will not need to append a PING frame, this
163      * is set to 1.
164      */
165     unsigned int reserve_allowed : 1;
166     /*
167      * Set to 1 if we have appended a STREAM frame with an implicit length. If
168      * this happens we should never append another frame after that frame as it
169      * cannot be validly encoded. This is just a safety check.
170      */
171     unsigned int done_implicit : 1;
172     struct {
173         /*
174          * The fields in this structure are valid if active is set, which means
175          * that a serialization transaction is currently in progress.
176          */
177         unsigned char   *data;
178         WPACKET         wpkt;
179         unsigned int    active : 1;
180     } txn;
181 };
182 
183 static void tx_helper_rollback(struct tx_helper *h);
184 static int txp_el_ensure_iovec(struct txp_el *el, size_t num);
185 
186 /* Initialises the TX helper. */
tx_helper_init(struct tx_helper * h,OSSL_QUIC_TX_PACKETISER * txp,uint32_t enc_level,size_t max_ppl,size_t reserve)187 static int tx_helper_init(struct tx_helper *h, OSSL_QUIC_TX_PACKETISER *txp,
188                           uint32_t enc_level, size_t max_ppl, size_t reserve)
189 {
190     if (reserve > max_ppl)
191         return 0;
192 
193     h->txp                  = txp;
194     h->enc_level            = enc_level;
195     h->max_ppl              = max_ppl;
196     h->reserve              = reserve;
197     h->num_iovec            = 0;
198     h->bytes_appended       = 0;
199     h->scratch_bytes        = 0;
200     h->reserve_allowed      = 0;
201     h->done_implicit        = 0;
202     h->txn.data             = NULL;
203     h->txn.active           = 0;
204 
205     if (max_ppl > h->txp->el[enc_level].scratch_len) {
206         unsigned char *scratch;
207 
208         scratch = OPENSSL_realloc(h->txp->el[enc_level].scratch, max_ppl);
209         if (scratch == NULL)
210             return 0;
211 
212         h->txp->el[enc_level].scratch     = scratch;
213         h->txp->el[enc_level].scratch_len = max_ppl;
214     }
215 
216     return 1;
217 }
218 
tx_helper_cleanup(struct tx_helper * h)219 static void tx_helper_cleanup(struct tx_helper *h)
220 {
221     if (h->txn.active)
222         tx_helper_rollback(h);
223 
224     h->txp = NULL;
225 }
226 
tx_helper_unrestrict(struct tx_helper * h)227 static void tx_helper_unrestrict(struct tx_helper *h)
228 {
229     h->reserve_allowed = 1;
230 }
231 
232 /*
233  * Append an extent of memory to the iovec list. The memory must remain
234  * allocated until we finish generating the packet and call the QTX.
235  *
236  * In general, the buffers passed to this function will be from one of two
237  * ranges:
238  *
239  *   - Application data contained in stream buffers managed elsewhere
240  *     in the QUIC stack; or
241  *
242  *   - Control frame data appended into txp->scratch using tx_helper_begin and
243  *     tx_helper_commit.
244  *
245  */
tx_helper_append_iovec(struct tx_helper * h,const unsigned char * buf,size_t buf_len)246 static int tx_helper_append_iovec(struct tx_helper *h,
247                                   const unsigned char *buf,
248                                   size_t buf_len)
249 {
250     struct txp_el *el = &h->txp->el[h->enc_level];
251 
252     if (buf_len == 0)
253         return 1;
254 
255     if (!ossl_assert(!h->done_implicit))
256         return 0;
257 
258     if (!txp_el_ensure_iovec(el, h->num_iovec + 1))
259         return 0;
260 
261     el->iovec[h->num_iovec].buf     = buf;
262     el->iovec[h->num_iovec].buf_len = buf_len;
263 
264     ++h->num_iovec;
265     h->bytes_appended += buf_len;
266     return 1;
267 }
268 
269 /*
270  * How many more bytes of space do we have left in our plaintext packet payload?
271  */
tx_helper_get_space_left(struct tx_helper * h)272 static size_t tx_helper_get_space_left(struct tx_helper *h)
273 {
274     return h->max_ppl
275         - (h->reserve_allowed ? 0 : h->reserve) - h->bytes_appended;
276 }
277 
278 /*
279  * Begin a control frame serialization transaction. This allows the
280  * serialization of the control frame to be backed out if it turns out it won't
281  * fit. Write the control frame to the returned WPACKET. Ensure you always
282  * call tx_helper_rollback or tx_helper_commit (or tx_helper_cleanup). Returns
283  * NULL on failure.
284  */
tx_helper_begin(struct tx_helper * h)285 static WPACKET *tx_helper_begin(struct tx_helper *h)
286 {
287     size_t space_left, len;
288     unsigned char *data;
289     struct txp_el *el = &h->txp->el[h->enc_level];
290 
291     if (!ossl_assert(!h->txn.active))
292         return NULL;
293 
294     if (!ossl_assert(!h->done_implicit))
295         return NULL;
296 
297     data = (unsigned char *)el->scratch + h->scratch_bytes;
298     len  = el->scratch_len - h->scratch_bytes;
299 
300     space_left = tx_helper_get_space_left(h);
301     if (!ossl_assert(space_left <= len))
302         return NULL;
303 
304     if (!WPACKET_init_static_len(&h->txn.wpkt, data, len, 0))
305         return NULL;
306 
307     if (!WPACKET_set_max_size(&h->txn.wpkt, space_left)) {
308         WPACKET_cleanup(&h->txn.wpkt);
309         return NULL;
310     }
311 
312     h->txn.data     = data;
313     h->txn.active   = 1;
314     return &h->txn.wpkt;
315 }
316 
tx_helper_end(struct tx_helper * h,int success)317 static void tx_helper_end(struct tx_helper *h, int success)
318 {
319     if (success)
320         WPACKET_finish(&h->txn.wpkt);
321     else
322         WPACKET_cleanup(&h->txn.wpkt);
323 
324     h->txn.active       = 0;
325     h->txn.data         = NULL;
326 }
327 
328 /* Abort a control frame serialization transaction. */
tx_helper_rollback(struct tx_helper * h)329 static void tx_helper_rollback(struct tx_helper *h)
330 {
331     if (!h->txn.active)
332         return;
333 
334     tx_helper_end(h, 0);
335 }
336 
337 /* Commit a control frame. */
tx_helper_commit(struct tx_helper * h)338 static int tx_helper_commit(struct tx_helper *h)
339 {
340     size_t l = 0;
341 
342     if (!h->txn.active)
343         return 0;
344 
345     if (!WPACKET_get_total_written(&h->txn.wpkt, &l)) {
346         tx_helper_end(h, 0);
347         return 0;
348     }
349 
350     if (!tx_helper_append_iovec(h, h->txn.data, l)) {
351         tx_helper_end(h, 0);
352         return 0;
353     }
354 
355     if (h->txp->msg_callback != NULL && l > 0) {
356         uint64_t ftype;
357         int ctype = SSL3_RT_QUIC_FRAME_FULL;
358         PACKET pkt;
359 
360         if (!PACKET_buf_init(&pkt, h->txn.data, l)
361                 || !ossl_quic_wire_peek_frame_header(&pkt, &ftype, NULL)) {
362             tx_helper_end(h, 0);
363             return 0;
364         }
365 
366         if (ftype == OSSL_QUIC_FRAME_TYPE_PADDING)
367             ctype = SSL3_RT_QUIC_FRAME_PADDING;
368         else if (OSSL_QUIC_FRAME_TYPE_IS_STREAM(ftype)
369                 || ftype == OSSL_QUIC_FRAME_TYPE_CRYPTO)
370             ctype = SSL3_RT_QUIC_FRAME_HEADER;
371 
372         h->txp->msg_callback(1, OSSL_QUIC1_VERSION, ctype, h->txn.data, l,
373                              h->txp->msg_callback_ssl,
374                              h->txp->msg_callback_arg);
375     }
376 
377     h->scratch_bytes += l;
378     tx_helper_end(h, 1);
379     return 1;
380 }
381 
382 struct archetype_data {
383     unsigned int allow_ack                  : 1;
384     unsigned int allow_ping                 : 1;
385     unsigned int allow_crypto               : 1;
386     unsigned int allow_handshake_done       : 1;
387     unsigned int allow_path_challenge       : 1;
388     unsigned int allow_path_response        : 1;
389     unsigned int allow_new_conn_id          : 1;
390     unsigned int allow_retire_conn_id       : 1;
391     unsigned int allow_stream_rel           : 1;
392     unsigned int allow_conn_fc              : 1;
393     unsigned int allow_conn_close           : 1;
394     unsigned int allow_cfq_other            : 1;
395     unsigned int allow_new_token            : 1;
396     unsigned int allow_force_ack_eliciting  : 1;
397     unsigned int allow_padding              : 1;
398     unsigned int require_ack_eliciting      : 1;
399     unsigned int bypass_cc                  : 1;
400 };
401 
402 struct txp_pkt_geom {
403     size_t                  cmpl, cmppl, hwm, pkt_overhead;
404     uint32_t                archetype;
405     struct archetype_data   adata;
406 };
407 
408 struct txp_pkt {
409     struct tx_helper    h;
410     int                 h_valid;
411     QUIC_TXPIM_PKT      *tpkt;
412     QUIC_STREAM         *stream_head;
413     QUIC_PKT_HDR        phdr;
414     struct txp_pkt_geom geom;
415     int                 force_pad;
416 };
417 
418 static QUIC_SSTREAM *get_sstream_by_id(uint64_t stream_id, uint32_t pn_space,
419                                        void *arg);
420 static void on_regen_notify(uint64_t frame_type, uint64_t stream_id,
421                             QUIC_TXPIM_PKT *pkt, void *arg);
422 static void on_confirm_notify(uint64_t frame_type, uint64_t stream_id,
423                               QUIC_TXPIM_PKT *pkt, void *arg);
424 static void on_sstream_updated(uint64_t stream_id, void *arg);
425 static int sstream_is_pending(QUIC_SSTREAM *sstream);
426 static int txp_should_try_staging(OSSL_QUIC_TX_PACKETISER *txp,
427                                   uint32_t enc_level,
428                                   uint32_t archetype,
429                                   uint64_t cc_limit,
430                                   uint32_t *conn_close_enc_level);
431 static size_t txp_determine_pn_len(OSSL_QUIC_TX_PACKETISER *txp);
432 static int txp_determine_ppl_from_pl(OSSL_QUIC_TX_PACKETISER *txp,
433                                      size_t pl,
434                                      uint32_t enc_level,
435                                      size_t hdr_len,
436                                      size_t *r);
437 static size_t txp_get_mdpl(OSSL_QUIC_TX_PACKETISER *txp);
438 static int txp_generate_for_el(OSSL_QUIC_TX_PACKETISER *txp,
439                                struct txp_pkt *pkt,
440                                int chosen_for_conn_close);
441 static int txp_pkt_init(struct txp_pkt *pkt, OSSL_QUIC_TX_PACKETISER *txp,
442                         uint32_t enc_level, uint32_t archetype,
443                         size_t running_total);
444 static void txp_pkt_cleanup(struct txp_pkt *pkt, OSSL_QUIC_TX_PACKETISER *txp);
445 static int txp_pkt_postgen_update_pkt_overhead(struct txp_pkt *pkt,
446                                                OSSL_QUIC_TX_PACKETISER *txp);
447 static int txp_pkt_append_padding(struct txp_pkt *pkt,
448                                   OSSL_QUIC_TX_PACKETISER *txp, size_t num_bytes);
449 static int txp_pkt_commit(OSSL_QUIC_TX_PACKETISER *txp, struct txp_pkt *pkt,
450                           uint32_t archetype, int *txpim_pkt_reffed);
451 static uint32_t txp_determine_archetype(OSSL_QUIC_TX_PACKETISER *txp,
452                                         uint64_t cc_limit);
453 
ossl_quic_tx_packetiser_new(const OSSL_QUIC_TX_PACKETISER_ARGS * args)454 OSSL_QUIC_TX_PACKETISER *ossl_quic_tx_packetiser_new(const OSSL_QUIC_TX_PACKETISER_ARGS *args)
455 {
456     OSSL_QUIC_TX_PACKETISER *txp;
457 
458     if (args == NULL
459         || args->qtx == NULL
460         || args->txpim == NULL
461         || args->cfq == NULL
462         || args->ackm == NULL
463         || args->qsm == NULL
464         || args->conn_txfc == NULL
465         || args->conn_rxfc == NULL
466         || args->max_streams_bidi_rxfc == NULL
467         || args->max_streams_uni_rxfc == NULL) {
468         ERR_raise(ERR_LIB_SSL, ERR_R_PASSED_NULL_PARAMETER);
469         return NULL;
470     }
471 
472     txp = OPENSSL_zalloc(sizeof(*txp));
473     if (txp == NULL)
474         return NULL;
475 
476     txp->args           = *args;
477     txp->last_tx_time   = ossl_time_zero();
478 
479     if (!ossl_quic_fifd_init(&txp->fifd,
480                              txp->args.cfq, txp->args.ackm, txp->args.txpim,
481                              get_sstream_by_id, txp,
482                              on_regen_notify, txp,
483                              on_confirm_notify, txp,
484                              on_sstream_updated, txp,
485                              args->get_qlog_cb,
486                              args->get_qlog_cb_arg)) {
487         OPENSSL_free(txp);
488         return NULL;
489     }
490 
491     return txp;
492 }
493 
ossl_quic_tx_packetiser_free(OSSL_QUIC_TX_PACKETISER * txp)494 void ossl_quic_tx_packetiser_free(OSSL_QUIC_TX_PACKETISER *txp)
495 {
496     uint32_t enc_level;
497 
498     if (txp == NULL)
499         return;
500 
501     ossl_quic_tx_packetiser_set_initial_token(txp, NULL, 0, NULL, NULL);
502     ossl_quic_fifd_cleanup(&txp->fifd);
503     OPENSSL_free(txp->conn_close_frame.reason);
504 
505     for (enc_level = QUIC_ENC_LEVEL_INITIAL;
506          enc_level < QUIC_ENC_LEVEL_NUM;
507          ++enc_level) {
508         OPENSSL_free(txp->el[enc_level].iovec);
509         OPENSSL_free(txp->el[enc_level].scratch);
510     }
511 
512     OPENSSL_free(txp);
513 }
514 
515 /*
516  * Determine if an Initial packet token length is reasonable based on the
517  * current MDPL, returning 1 if it is OK.
518  *
519  * The real PMTU to the peer could differ from our (pessimistic) understanding
520  * of the PMTU, therefore it is possible we could receive an Initial token from
521  * a server in a Retry packet which is bigger than the MDPL. In this case it is
522  * impossible for us ever to make forward progress and we need to error out
523  * and fail the connection attempt.
524  *
525  * The specific boundary condition is complex: for example, after the size of
526  * the Initial token, there are the Initial packet header overheads and then
527  * encryption/AEAD tag overheads. After that, the minimum room for frame data in
528  * order to guarantee forward progress must be guaranteed. For example, a crypto
529  * stream needs to always be able to serialize at least one byte in a CRYPTO
530  * frame in order to make forward progress. Because the offset field of a CRYPTO
531  * frame uses a variable-length integer, the number of bytes needed to ensure
532  * this also varies.
533  *
534  * Rather than trying to get this boundary condition check actually right,
535  * require a reasonable amount of slack to avoid pathological behaviours. (After
536  * all, transmitting a CRYPTO stream one byte at a time is probably not
537  * desirable anyway.)
538  *
539  * We choose 160 bytes as the required margin, which is double the rough
540  * estimation of the minimum we would require to guarantee forward progress
541  * under worst case packet overheads.
542  */
543 #define TXP_REQUIRED_TOKEN_MARGIN       160
544 
txp_check_token_len(size_t token_len,size_t mdpl)545 static int txp_check_token_len(size_t token_len, size_t mdpl)
546 {
547     if (token_len == 0)
548         return 1;
549 
550     if (token_len >= mdpl)
551         return 0;
552 
553     if (TXP_REQUIRED_TOKEN_MARGIN >= mdpl)
554         /* (should not be possible because MDPL must be at least 1200) */
555         return 0;
556 
557     if (token_len > mdpl - TXP_REQUIRED_TOKEN_MARGIN)
558         return 0;
559 
560     return 1;
561 }
562 
ossl_quic_tx_packetiser_set_initial_token(OSSL_QUIC_TX_PACKETISER * txp,const unsigned char * token,size_t token_len,ossl_quic_initial_token_free_fn * free_cb,void * free_cb_arg)563 int ossl_quic_tx_packetiser_set_initial_token(OSSL_QUIC_TX_PACKETISER *txp,
564                                               const unsigned char *token,
565                                               size_t token_len,
566                                               ossl_quic_initial_token_free_fn *free_cb,
567                                               void *free_cb_arg)
568 {
569     if (!txp_check_token_len(token_len, txp_get_mdpl(txp)))
570         return 0;
571 
572     if (txp->initial_token != NULL && txp->initial_token_free_cb != NULL)
573         txp->initial_token_free_cb(txp->initial_token, txp->initial_token_len,
574                                    txp->initial_token_free_cb_arg);
575 
576     txp->initial_token              = token;
577     txp->initial_token_len          = token_len;
578     txp->initial_token_free_cb      = free_cb;
579     txp->initial_token_free_cb_arg  = free_cb_arg;
580     return 1;
581 }
582 
ossl_quic_tx_packetiser_set_cur_dcid(OSSL_QUIC_TX_PACKETISER * txp,const QUIC_CONN_ID * dcid)583 int ossl_quic_tx_packetiser_set_cur_dcid(OSSL_QUIC_TX_PACKETISER *txp,
584                                          const QUIC_CONN_ID *dcid)
585 {
586     if (dcid == NULL) {
587         ERR_raise(ERR_LIB_SSL, ERR_R_PASSED_NULL_PARAMETER);
588         return 0;
589     }
590 
591     txp->args.cur_dcid = *dcid;
592     return 1;
593 }
594 
ossl_quic_tx_packetiser_set_cur_scid(OSSL_QUIC_TX_PACKETISER * txp,const QUIC_CONN_ID * scid)595 int ossl_quic_tx_packetiser_set_cur_scid(OSSL_QUIC_TX_PACKETISER *txp,
596                                          const QUIC_CONN_ID *scid)
597 {
598     if (scid == NULL) {
599         ERR_raise(ERR_LIB_SSL, ERR_R_PASSED_NULL_PARAMETER);
600         return 0;
601     }
602 
603     txp->args.cur_scid = *scid;
604     return 1;
605 }
606 
607 /* Change the destination L4 address the TXP uses to send datagrams. */
ossl_quic_tx_packetiser_set_peer(OSSL_QUIC_TX_PACKETISER * txp,const BIO_ADDR * peer)608 int ossl_quic_tx_packetiser_set_peer(OSSL_QUIC_TX_PACKETISER *txp,
609                                      const BIO_ADDR *peer)
610 {
611     if (peer == NULL) {
612         BIO_ADDR_clear(&txp->args.peer);
613         return 1;
614     }
615 
616     txp->args.peer = *peer;
617     return 1;
618 }
619 
ossl_quic_tx_packetiser_set_ack_tx_cb(OSSL_QUIC_TX_PACKETISER * txp,void (* cb)(const OSSL_QUIC_FRAME_ACK * ack,uint32_t pn_space,void * arg),void * cb_arg)620 void ossl_quic_tx_packetiser_set_ack_tx_cb(OSSL_QUIC_TX_PACKETISER *txp,
621                                            void (*cb)(const OSSL_QUIC_FRAME_ACK *ack,
622                                                       uint32_t pn_space,
623                                                       void *arg),
624                                            void *cb_arg)
625 {
626     txp->ack_tx_cb      = cb;
627     txp->ack_tx_cb_arg  = cb_arg;
628 }
629 
ossl_quic_tx_packetiser_set_qlog_cb(OSSL_QUIC_TX_PACKETISER * txp,QLOG * (* get_qlog_cb)(void * arg),void * get_qlog_cb_arg)630 void ossl_quic_tx_packetiser_set_qlog_cb(OSSL_QUIC_TX_PACKETISER *txp,
631                                          QLOG *(*get_qlog_cb)(void *arg),
632                                          void *get_qlog_cb_arg)
633 {
634     ossl_quic_fifd_set_qlog_cb(&txp->fifd, get_qlog_cb, get_qlog_cb_arg);
635 
636 }
637 
ossl_quic_tx_packetiser_discard_enc_level(OSSL_QUIC_TX_PACKETISER * txp,uint32_t enc_level)638 int ossl_quic_tx_packetiser_discard_enc_level(OSSL_QUIC_TX_PACKETISER *txp,
639                                               uint32_t enc_level)
640 {
641     if (enc_level >= QUIC_ENC_LEVEL_NUM) {
642         ERR_raise(ERR_LIB_SSL, ERR_R_PASSED_INVALID_ARGUMENT);
643         return 0;
644     }
645 
646     if (enc_level != QUIC_ENC_LEVEL_0RTT)
647         txp->args.crypto[ossl_quic_enc_level_to_pn_space(enc_level)] = NULL;
648 
649     return 1;
650 }
651 
ossl_quic_tx_packetiser_notify_handshake_complete(OSSL_QUIC_TX_PACKETISER * txp)652 void ossl_quic_tx_packetiser_notify_handshake_complete(OSSL_QUIC_TX_PACKETISER *txp)
653 {
654     txp->handshake_complete = 1;
655 }
656 
ossl_quic_tx_packetiser_schedule_handshake_done(OSSL_QUIC_TX_PACKETISER * txp)657 void ossl_quic_tx_packetiser_schedule_handshake_done(OSSL_QUIC_TX_PACKETISER *txp)
658 {
659     txp->want_handshake_done = 1;
660 }
661 
ossl_quic_tx_packetiser_schedule_ack_eliciting(OSSL_QUIC_TX_PACKETISER * txp,uint32_t pn_space)662 void ossl_quic_tx_packetiser_schedule_ack_eliciting(OSSL_QUIC_TX_PACKETISER *txp,
663                                                     uint32_t pn_space)
664 {
665     txp->force_ack_eliciting |= (1UL << pn_space);
666 }
667 
ossl_quic_tx_packetiser_schedule_ack(OSSL_QUIC_TX_PACKETISER * txp,uint32_t pn_space)668 void ossl_quic_tx_packetiser_schedule_ack(OSSL_QUIC_TX_PACKETISER *txp,
669                                           uint32_t pn_space)
670 {
671     txp->want_ack |= (1UL << pn_space);
672 }
673 
674 #define TXP_ERR_INTERNAL     0  /* Internal (e.g. alloc) error */
675 #define TXP_ERR_SUCCESS      1  /* Success */
676 #define TXP_ERR_SPACE        2  /* Not enough room for another packet */
677 #define TXP_ERR_INPUT        3  /* Invalid/malformed input */
678 
679 /*
680  * Generates a datagram by polling the various ELs to determine if they want to
681  * generate any frames, and generating a datagram which coalesces packets for
682  * any ELs which do.
683  */
ossl_quic_tx_packetiser_generate(OSSL_QUIC_TX_PACKETISER * txp,QUIC_TXP_STATUS * status)684 int ossl_quic_tx_packetiser_generate(OSSL_QUIC_TX_PACKETISER *txp,
685                                      QUIC_TXP_STATUS *status)
686 {
687     /*
688      * Called to generate one or more datagrams, each containing one or more
689      * packets.
690      *
691      * There are some tricky things to note here:
692      *
693      *   - The TXP is only concerned with generating encrypted packets;
694      *     other packets use a different path.
695      *
696      *   - Any datagram containing an Initial packet must have a payload length
697      *     (DPL) of at least 1200 bytes. This padding need not necessarily be
698      *     found in the Initial packet.
699      *
700      *     - It is desirable to be able to coalesce an Initial packet
701      *       with a Handshake packet. Since, before generating the Handshake
702      *       packet, we do not know how long it will be, we cannot know the
703      *       correct amount of padding to ensure a DPL of at least 1200 bytes.
704      *       Thus this padding must added to the Handshake packet (or whatever
705      *       packet is the last in the datagram).
706      *
707      *     - However, at the time that we generate the Initial packet,
708      *       we do not actually know for sure that we will be followed
709      *       in the datagram by another packet. For example, suppose we have
710      *       some queued data (e.g. crypto stream data for the HANDSHAKE EL)
711      *       it looks like we will want to send on the HANDSHAKE EL.
712      *       We could assume padding will be placed in the Handshake packet
713      *       subsequently and avoid adding any padding to the Initial packet
714      *       (which would leave no room for the Handshake packet in the
715      *       datagram).
716      *
717      *       However, this is not actually a safe assumption. Suppose that we
718      *       are using a link with a MDPL of 1200 bytes, the minimum allowed by
719      *       QUIC. Suppose that the Initial packet consumes 1195 bytes in total.
720      *       Since it is not possible to fit a Handshake packet in just 5 bytes,
721      *       upon trying to add a Handshake packet after generating the Initial
722      *       packet, we will discover we have no room to fit it! This is not a
723      *       problem in itself as another datagram can be sent subsequently, but
724      *       it is a problem because we were counting to use that packet to hold
725      *       the essential padding. But if we have already finished encrypting
726      *       the Initial packet, we cannot go and add padding to it anymore.
727      *       This leaves us stuck.
728      *
729      * Because of this, we have to plan multiple packets simultaneously, such
730      * that we can start generating a Handshake (or 0-RTT or 1-RTT, or so on)
731      * packet while still having the option to go back and add padding to the
732      * Initial packet if it turns out to be needed.
733      *
734      * Trying to predict ahead of time (e.g. during Initial packet generation)
735      * whether we will successfully generate a subsequent packet is fraught with
736      * error as it relies on a large number of variables:
737      *
738      *   - Do we have room to fit a packet header? (Consider that due to
739      *     variable-length integer encoding this is highly variable and can even
740      *     depend on payload length due to a variable-length Length field.)
741      *
742      *   - Can we fit even a single one of the frames we want to put in this
743      *     packet in the packet? (Each frame type has a bespoke encoding. While
744      *     our encodings of some frame types are adaptive based on the available
745      *     room - e.g. STREAM frames - ultimately all frame types have some
746      *     absolute minimum number of bytes to be successfully encoded. For
747      *     example, if after an Initial packet there is enough room to encode
748      *     only one byte of frame data, it is quite likely we can't send any of
749      *     the frames we wanted to send.) While this is not strictly a problem
750      *     because we could just fill the packet with padding frames, this is a
751      *     pointless packet and is wasteful.
752      *
753      * Thus we adopt a multi-phase architecture:
754      *
755      *   1. Archetype Selection: Determine desired packet archetype.
756      *
757      *   2. Packet Staging: Generation of packet information and packet payload
758      *      data (frame data) into staging areas.
759      *
760      *   3. Packet Adjustment: Adjustment of staged packets, adding padding to
761      *      the staged packets if needed.
762      *
763      *   4. Commit: The packets are sent to the QTX and recorded as having been
764      *      sent to the FIFM.
765      *
766      */
767     int res = 0, rc;
768     uint32_t archetype, enc_level;
769     uint32_t conn_close_enc_level = QUIC_ENC_LEVEL_NUM;
770     struct txp_pkt pkt[QUIC_ENC_LEVEL_NUM];
771     size_t pkts_done = 0;
772     uint64_t cc_limit = txp->args.cc_method->get_tx_allowance(txp->args.cc_data);
773     int need_padding = 0, txpim_pkt_reffed;
774 
775     for (enc_level = QUIC_ENC_LEVEL_INITIAL;
776          enc_level < QUIC_ENC_LEVEL_NUM;
777          ++enc_level)
778         pkt[enc_level].h_valid = 0;
779 
780     memset(status, 0, sizeof(*status));
781 
782     /*
783      * Should not be needed, but a sanity check in case anyone else has been
784      * using the QTX.
785      */
786     ossl_qtx_finish_dgram(txp->args.qtx);
787 
788     /* 1. Archetype Selection */
789     archetype = txp_determine_archetype(txp, cc_limit);
790 
791     /* 2. Packet Staging */
792     for (enc_level = QUIC_ENC_LEVEL_INITIAL;
793          enc_level < QUIC_ENC_LEVEL_NUM;
794          ++enc_level) {
795         size_t running_total = (enc_level > QUIC_ENC_LEVEL_INITIAL)
796             ? pkt[enc_level - 1].geom.hwm : 0;
797 
798         pkt[enc_level].geom.hwm = running_total;
799 
800         if (!txp_should_try_staging(txp, enc_level, archetype, cc_limit,
801                                     &conn_close_enc_level))
802             continue;
803 
804         if (!txp_pkt_init(&pkt[enc_level], txp, enc_level, archetype,
805                           running_total))
806             /*
807              * If this fails this is not a fatal error - it means the geometry
808              * planning determined there was not enough space for another
809              * packet. So just proceed with what we've already planned for.
810              */
811             break;
812 
813         rc = txp_generate_for_el(txp, &pkt[enc_level],
814                                  conn_close_enc_level == enc_level);
815         if (rc != TXP_ERR_SUCCESS)
816             goto out;
817 
818         if (pkt[enc_level].force_pad)
819             /*
820              * txp_generate_for_el emitted a frame which forces packet padding.
821              */
822             need_padding = 1;
823 
824         pkt[enc_level].geom.hwm = running_total
825             + pkt[enc_level].h.bytes_appended
826             + pkt[enc_level].geom.pkt_overhead;
827     }
828 
829     /* 3. Packet Adjustment */
830     if (pkt[QUIC_ENC_LEVEL_INITIAL].h_valid
831         && pkt[QUIC_ENC_LEVEL_INITIAL].h.bytes_appended > 0)
832         /*
833          * We have an Initial packet in this datagram, so we need to make sure
834          * the total size of the datagram is adequate.
835          */
836         need_padding = 1;
837 
838     if (need_padding) {
839         size_t total_dgram_size = 0;
840         const size_t min_dpl = QUIC_MIN_INITIAL_DGRAM_LEN;
841         uint32_t pad_el = QUIC_ENC_LEVEL_NUM;
842 
843         for (enc_level = QUIC_ENC_LEVEL_INITIAL;
844              enc_level < QUIC_ENC_LEVEL_NUM;
845              ++enc_level)
846             if (pkt[enc_level].h_valid && pkt[enc_level].h.bytes_appended > 0) {
847                 if (pad_el == QUIC_ENC_LEVEL_NUM
848                     /*
849                      * We might not be able to add padding, for example if we
850                      * are using the ACK_ONLY archetype.
851                      */
852                     && pkt[enc_level].geom.adata.allow_padding
853                     && !pkt[enc_level].h.done_implicit)
854                     pad_el = enc_level;
855 
856                 txp_pkt_postgen_update_pkt_overhead(&pkt[enc_level], txp);
857                 total_dgram_size += pkt[enc_level].geom.pkt_overhead
858                     + pkt[enc_level].h.bytes_appended;
859             }
860 
861         if (pad_el != QUIC_ENC_LEVEL_NUM && total_dgram_size < min_dpl) {
862             size_t deficit = min_dpl - total_dgram_size;
863 
864             if (!txp_pkt_append_padding(&pkt[pad_el], txp, deficit))
865                 goto out;
866 
867             total_dgram_size += deficit;
868 
869             /*
870              * Padding frames make a packet ineligible for being a non-inflight
871              * packet.
872              */
873             pkt[pad_el].tpkt->ackm_pkt.is_inflight = 1;
874         }
875 
876         /*
877          * If we have failed to make a datagram of adequate size, for example
878          * because we have a padding requirement but are using the ACK_ONLY
879          * archetype (because we are CC limited), which precludes us from
880          * sending padding, give up on generating the datagram - there is
881          * nothing we can do.
882          */
883         if (total_dgram_size < min_dpl) {
884             res = 1;
885             goto out;
886         }
887     }
888 
889     /* 4. Commit */
890     for (enc_level = QUIC_ENC_LEVEL_INITIAL;
891          enc_level < QUIC_ENC_LEVEL_NUM;
892          ++enc_level) {
893 
894         if (!pkt[enc_level].h_valid)
895             /* Did not attempt to generate a packet for this EL. */
896             continue;
897 
898         if (pkt[enc_level].h.bytes_appended == 0)
899             /* Nothing was generated for this EL, so skip. */
900             continue;
901 
902         rc = txp_pkt_commit(txp, &pkt[enc_level], archetype,
903                             &txpim_pkt_reffed);
904         if (rc) {
905             status->sent_ack_eliciting
906                 = status->sent_ack_eliciting
907                 || pkt[enc_level].tpkt->ackm_pkt.is_ack_eliciting;
908 
909             if (enc_level == QUIC_ENC_LEVEL_HANDSHAKE)
910                 status->sent_handshake
911                     = (pkt[enc_level].h_valid
912                        && pkt[enc_level].h.bytes_appended > 0);
913         }
914 
915         if (txpim_pkt_reffed)
916             pkt[enc_level].tpkt = NULL; /* don't free */
917 
918         if (!rc)
919             goto out;
920 
921         ++pkts_done;
922     }
923 
924     /* Flush & Cleanup */
925     res = 1;
926 out:
927     ossl_qtx_finish_dgram(txp->args.qtx);
928 
929     for (enc_level = QUIC_ENC_LEVEL_INITIAL;
930          enc_level < QUIC_ENC_LEVEL_NUM;
931          ++enc_level)
932         txp_pkt_cleanup(&pkt[enc_level], txp);
933 
934     status->sent_pkt = pkts_done;
935 
936     return res;
937 }
938 
939 static const struct archetype_data archetypes[QUIC_ENC_LEVEL_NUM][TX_PACKETISER_ARCHETYPE_NUM] = {
940     /* EL 0(INITIAL) */
941     {
942         /* EL 0(INITIAL) - Archetype 0(NORMAL) */
943         {
944             /*allow_ack                       =*/ 1,
945             /*allow_ping                      =*/ 1,
946             /*allow_crypto                    =*/ 1,
947             /*allow_handshake_done            =*/ 0,
948             /*allow_path_challenge            =*/ 0,
949             /*allow_path_response             =*/ 0,
950             /*allow_new_conn_id               =*/ 0,
951             /*allow_retire_conn_id            =*/ 0,
952             /*allow_stream_rel                =*/ 0,
953             /*allow_conn_fc                   =*/ 0,
954             /*allow_conn_close                =*/ 1,
955             /*allow_cfq_other                 =*/ 0,
956             /*allow_new_token                 =*/ 0,
957             /*allow_force_ack_eliciting       =*/ 1,
958             /*allow_padding                   =*/ 1,
959             /*require_ack_eliciting           =*/ 0,
960             /*bypass_cc                       =*/ 0,
961         },
962         /* EL 0(INITIAL) - Archetype 1(PROBE) */
963         {
964             /*allow_ack                       =*/ 1,
965             /*allow_ping                      =*/ 1,
966             /*allow_crypto                    =*/ 1,
967             /*allow_handshake_done            =*/ 0,
968             /*allow_path_challenge            =*/ 0,
969             /*allow_path_response             =*/ 0,
970             /*allow_new_conn_id               =*/ 0,
971             /*allow_retire_conn_id            =*/ 0,
972             /*allow_stream_rel                =*/ 0,
973             /*allow_conn_fc                   =*/ 0,
974             /*allow_conn_close                =*/ 1,
975             /*allow_cfq_other                 =*/ 0,
976             /*allow_new_token                 =*/ 0,
977             /*allow_force_ack_eliciting       =*/ 1,
978             /*allow_padding                   =*/ 1,
979             /*require_ack_eliciting           =*/ 1,
980             /*bypass_cc                       =*/ 1,
981         },
982         /* EL 0(INITIAL) - Archetype 2(ACK_ONLY) */
983         {
984             /*allow_ack                       =*/ 1,
985             /*allow_ping                      =*/ 0,
986             /*allow_crypto                    =*/ 0,
987             /*allow_handshake_done            =*/ 0,
988             /*allow_path_challenge            =*/ 0,
989             /*allow_path_response             =*/ 0,
990             /*allow_new_conn_id               =*/ 0,
991             /*allow_retire_conn_id            =*/ 0,
992             /*allow_stream_rel                =*/ 0,
993             /*allow_conn_fc                   =*/ 0,
994             /*allow_conn_close                =*/ 0,
995             /*allow_cfq_other                 =*/ 0,
996             /*allow_new_token                 =*/ 0,
997             /*allow_force_ack_eliciting       =*/ 1,
998             /*allow_padding                   =*/ 0,
999             /*require_ack_eliciting           =*/ 0,
1000             /*bypass_cc                       =*/ 1,
1001         },
1002     },
1003     /* EL 1(HANDSHAKE) */
1004     {
1005         /* EL 1(HANDSHAKE) - Archetype 0(NORMAL) */
1006         {
1007             /*allow_ack                       =*/ 1,
1008             /*allow_ping                      =*/ 1,
1009             /*allow_crypto                    =*/ 1,
1010             /*allow_handshake_done            =*/ 0,
1011             /*allow_path_challenge            =*/ 0,
1012             /*allow_path_response             =*/ 0,
1013             /*allow_new_conn_id               =*/ 0,
1014             /*allow_retire_conn_id            =*/ 0,
1015             /*allow_stream_rel                =*/ 0,
1016             /*allow_conn_fc                   =*/ 0,
1017             /*allow_conn_close                =*/ 1,
1018             /*allow_cfq_other                 =*/ 0,
1019             /*allow_new_token                 =*/ 0,
1020             /*allow_force_ack_eliciting       =*/ 1,
1021             /*allow_padding                   =*/ 1,
1022             /*require_ack_eliciting           =*/ 0,
1023             /*bypass_cc                       =*/ 0,
1024         },
1025         /* EL 1(HANDSHAKE) - Archetype 1(PROBE) */
1026         {
1027             /*allow_ack                       =*/ 1,
1028             /*allow_ping                      =*/ 1,
1029             /*allow_crypto                    =*/ 1,
1030             /*allow_handshake_done            =*/ 0,
1031             /*allow_path_challenge            =*/ 0,
1032             /*allow_path_response             =*/ 0,
1033             /*allow_new_conn_id               =*/ 0,
1034             /*allow_retire_conn_id            =*/ 0,
1035             /*allow_stream_rel                =*/ 0,
1036             /*allow_conn_fc                   =*/ 0,
1037             /*allow_conn_close                =*/ 1,
1038             /*allow_cfq_other                 =*/ 0,
1039             /*allow_new_token                 =*/ 0,
1040             /*allow_force_ack_eliciting       =*/ 1,
1041             /*allow_padding                   =*/ 1,
1042             /*require_ack_eliciting           =*/ 1,
1043             /*bypass_cc                       =*/ 1,
1044         },
1045         /* EL 1(HANDSHAKE) - Archetype 2(ACK_ONLY) */
1046         {
1047             /*allow_ack                       =*/ 1,
1048             /*allow_ping                      =*/ 0,
1049             /*allow_crypto                    =*/ 0,
1050             /*allow_handshake_done            =*/ 0,
1051             /*allow_path_challenge            =*/ 0,
1052             /*allow_path_response             =*/ 0,
1053             /*allow_new_conn_id               =*/ 0,
1054             /*allow_retire_conn_id            =*/ 0,
1055             /*allow_stream_rel                =*/ 0,
1056             /*allow_conn_fc                   =*/ 0,
1057             /*allow_conn_close                =*/ 0,
1058             /*allow_cfq_other                 =*/ 0,
1059             /*allow_new_token                 =*/ 0,
1060             /*allow_force_ack_eliciting       =*/ 1,
1061             /*allow_padding                   =*/ 0,
1062             /*require_ack_eliciting           =*/ 0,
1063             /*bypass_cc                       =*/ 1,
1064         },
1065     },
1066     /* EL 2(0RTT) */
1067     {
1068         /* EL 2(0RTT) - Archetype 0(NORMAL) */
1069         {
1070             /*allow_ack                       =*/ 0,
1071             /*allow_ping                      =*/ 1,
1072             /*allow_crypto                    =*/ 0,
1073             /*allow_handshake_done            =*/ 0,
1074             /*allow_path_challenge            =*/ 0,
1075             /*allow_path_response             =*/ 0,
1076             /*allow_new_conn_id               =*/ 1,
1077             /*allow_retire_conn_id            =*/ 1,
1078             /*allow_stream_rel                =*/ 1,
1079             /*allow_conn_fc                   =*/ 1,
1080             /*allow_conn_close                =*/ 1,
1081             /*allow_cfq_other                 =*/ 0,
1082             /*allow_new_token                 =*/ 0,
1083             /*allow_force_ack_eliciting       =*/ 0,
1084             /*allow_padding                   =*/ 1,
1085             /*require_ack_eliciting           =*/ 0,
1086             /*bypass_cc                       =*/ 0,
1087         },
1088         /* EL 2(0RTT) - Archetype 1(PROBE) */
1089         {
1090             /*allow_ack                       =*/ 0,
1091             /*allow_ping                      =*/ 1,
1092             /*allow_crypto                    =*/ 0,
1093             /*allow_handshake_done            =*/ 0,
1094             /*allow_path_challenge            =*/ 0,
1095             /*allow_path_response             =*/ 0,
1096             /*allow_new_conn_id               =*/ 1,
1097             /*allow_retire_conn_id            =*/ 1,
1098             /*allow_stream_rel                =*/ 1,
1099             /*allow_conn_fc                   =*/ 1,
1100             /*allow_conn_close                =*/ 1,
1101             /*allow_cfq_other                 =*/ 0,
1102             /*allow_new_token                 =*/ 0,
1103             /*allow_force_ack_eliciting       =*/ 0,
1104             /*allow_padding                   =*/ 1,
1105             /*require_ack_eliciting           =*/ 1,
1106             /*bypass_cc                       =*/ 1,
1107         },
1108         /* EL 2(0RTT) - Archetype 2(ACK_ONLY) */
1109         {
1110             /*allow_ack                       =*/ 0,
1111             /*allow_ping                      =*/ 0,
1112             /*allow_crypto                    =*/ 0,
1113             /*allow_handshake_done            =*/ 0,
1114             /*allow_path_challenge            =*/ 0,
1115             /*allow_path_response             =*/ 0,
1116             /*allow_new_conn_id               =*/ 0,
1117             /*allow_retire_conn_id            =*/ 0,
1118             /*allow_stream_rel                =*/ 0,
1119             /*allow_conn_fc                   =*/ 0,
1120             /*allow_conn_close                =*/ 0,
1121             /*allow_cfq_other                 =*/ 0,
1122             /*allow_new_token                 =*/ 0,
1123             /*allow_force_ack_eliciting       =*/ 0,
1124             /*allow_padding                   =*/ 0,
1125             /*require_ack_eliciting           =*/ 0,
1126             /*bypass_cc                       =*/ 1,
1127         },
1128     },
1129     /* EL 3(1RTT) */
1130     {
1131         /* EL 3(1RTT) - Archetype 0(NORMAL) */
1132         {
1133             /*allow_ack                       =*/ 1,
1134             /*allow_ping                      =*/ 1,
1135             /*allow_crypto                    =*/ 1,
1136             /*allow_handshake_done            =*/ 1,
1137             /*allow_path_challenge            =*/ 0,
1138             /*allow_path_response             =*/ 1,
1139             /*allow_new_conn_id               =*/ 1,
1140             /*allow_retire_conn_id            =*/ 1,
1141             /*allow_stream_rel                =*/ 1,
1142             /*allow_conn_fc                   =*/ 1,
1143             /*allow_conn_close                =*/ 1,
1144             /*allow_cfq_other                 =*/ 1,
1145             /*allow_new_token                 =*/ 1,
1146             /*allow_force_ack_eliciting       =*/ 1,
1147             /*allow_padding                   =*/ 1,
1148             /*require_ack_eliciting           =*/ 0,
1149             /*bypass_cc                       =*/ 0,
1150         },
1151         /* EL 3(1RTT) - Archetype 1(PROBE) */
1152         {
1153             /*allow_ack                       =*/ 1,
1154             /*allow_ping                      =*/ 1,
1155             /*allow_crypto                    =*/ 1,
1156             /*allow_handshake_done            =*/ 1,
1157             /*allow_path_challenge            =*/ 0,
1158             /*allow_path_response             =*/ 1,
1159             /*allow_new_conn_id               =*/ 1,
1160             /*allow_retire_conn_id            =*/ 1,
1161             /*allow_stream_rel                =*/ 1,
1162             /*allow_conn_fc                   =*/ 1,
1163             /*allow_conn_close                =*/ 1,
1164             /*allow_cfq_other                 =*/ 1,
1165             /*allow_new_token                 =*/ 1,
1166             /*allow_force_ack_eliciting       =*/ 1,
1167             /*allow_padding                   =*/ 1,
1168             /*require_ack_eliciting           =*/ 1,
1169             /*bypass_cc                       =*/ 1,
1170         },
1171         /* EL 3(1RTT) - Archetype 2(ACK_ONLY) */
1172         {
1173             /*allow_ack                       =*/ 1,
1174             /*allow_ping                      =*/ 0,
1175             /*allow_crypto                    =*/ 0,
1176             /*allow_handshake_done            =*/ 0,
1177             /*allow_path_challenge            =*/ 0,
1178             /*allow_path_response             =*/ 0,
1179             /*allow_new_conn_id               =*/ 0,
1180             /*allow_retire_conn_id            =*/ 0,
1181             /*allow_stream_rel                =*/ 0,
1182             /*allow_conn_fc                   =*/ 0,
1183             /*allow_conn_close                =*/ 0,
1184             /*allow_cfq_other                 =*/ 0,
1185             /*allow_new_token                 =*/ 0,
1186             /*allow_force_ack_eliciting       =*/ 1,
1187             /*allow_padding                   =*/ 0,
1188             /*require_ack_eliciting           =*/ 0,
1189             /*bypass_cc                       =*/ 1,
1190         }
1191     }
1192 };
1193 
txp_get_archetype_data(uint32_t enc_level,uint32_t archetype,struct archetype_data * a)1194 static int txp_get_archetype_data(uint32_t enc_level,
1195                                   uint32_t archetype,
1196                                   struct archetype_data *a)
1197 {
1198     if (enc_level >= QUIC_ENC_LEVEL_NUM
1199         || archetype >= TX_PACKETISER_ARCHETYPE_NUM)
1200         return 0;
1201 
1202     /* No need to avoid copying this as it should not exceed one int in size. */
1203     *a = archetypes[enc_level][archetype];
1204     return 1;
1205 }
1206 
txp_determine_geometry(OSSL_QUIC_TX_PACKETISER * txp,uint32_t archetype,uint32_t enc_level,size_t running_total,QUIC_PKT_HDR * phdr,struct txp_pkt_geom * geom)1207 static int txp_determine_geometry(OSSL_QUIC_TX_PACKETISER *txp,
1208                                   uint32_t archetype,
1209                                   uint32_t enc_level,
1210                                   size_t running_total,
1211                                   QUIC_PKT_HDR *phdr,
1212                                   struct txp_pkt_geom *geom)
1213 {
1214     size_t mdpl, cmpl, hdr_len;
1215 
1216     /* Get information about packet archetype. */
1217     if (!txp_get_archetype_data(enc_level, archetype, &geom->adata))
1218        return 0;
1219 
1220     /* Assemble packet header. */
1221     phdr->type          = ossl_quic_enc_level_to_pkt_type(enc_level);
1222     phdr->spin_bit      = 0;
1223     phdr->pn_len        = txp_determine_pn_len(txp);
1224     phdr->partial       = 0;
1225     phdr->fixed         = 1;
1226     phdr->reserved      = 0;
1227     phdr->version       = QUIC_VERSION_1;
1228     phdr->dst_conn_id   = txp->args.cur_dcid;
1229     phdr->src_conn_id   = txp->args.cur_scid;
1230 
1231     /*
1232      * We need to know the length of the payload to get an accurate header
1233      * length for non-1RTT packets, because the Length field found in
1234      * Initial/Handshake/0-RTT packets uses a variable-length encoding. However,
1235      * we don't have a good idea of the length of our payload, because the
1236      * length of the payload depends on the room in the datagram after fitting
1237      * the header, which depends on the size of the header.
1238      *
1239      * In general, it does not matter if a packet is slightly shorter (because
1240      * e.g. we predicted use of a 2-byte length field, but ended up only needing
1241      * a 1-byte length field). However this does matter for Initial packets
1242      * which must be at least 1200 bytes, which is also the assumed default MTU;
1243      * therefore in many cases Initial packets will be padded to 1200 bytes,
1244      * which means if we overestimated the header size, we will be short by a
1245      * few bytes and the server will ignore the packet for being too short. In
1246      * this case, however, such packets always *will* be padded to meet 1200
1247      * bytes, which requires a 2-byte length field, so we don't actually need to
1248      * worry about this. Thus we estimate the header length assuming a 2-byte
1249      * length field here, which should in practice work well in all cases.
1250      */
1251     phdr->len           = OSSL_QUIC_VLINT_2B_MAX - phdr->pn_len;
1252 
1253     if (enc_level == QUIC_ENC_LEVEL_INITIAL) {
1254         phdr->token     = txp->initial_token;
1255         phdr->token_len = txp->initial_token_len;
1256     } else {
1257         phdr->token     = NULL;
1258         phdr->token_len = 0;
1259     }
1260 
1261     hdr_len = ossl_quic_wire_get_encoded_pkt_hdr_len(phdr->dst_conn_id.id_len,
1262                                                      phdr);
1263     if (hdr_len == 0)
1264         return 0;
1265 
1266     /* MDPL: Maximum datagram payload length. */
1267     mdpl = txp_get_mdpl(txp);
1268 
1269     /*
1270      * CMPL: Maximum encoded packet size we can put into this datagram given any
1271      * previous packets coalesced into it.
1272      */
1273     if (running_total > mdpl)
1274         /* Should not be possible, but if it happens: */
1275         cmpl = 0;
1276     else
1277         cmpl = mdpl - running_total;
1278 
1279     /* CMPPL: Maximum amount we can put into the current packet payload */
1280     if (!txp_determine_ppl_from_pl(txp, cmpl, enc_level, hdr_len, &geom->cmppl))
1281         return 0;
1282 
1283     geom->cmpl                  = cmpl;
1284     geom->pkt_overhead          = cmpl - geom->cmppl;
1285     geom->archetype             = archetype;
1286     return 1;
1287 }
1288 
txp_determine_archetype(OSSL_QUIC_TX_PACKETISER * txp,uint64_t cc_limit)1289 static uint32_t txp_determine_archetype(OSSL_QUIC_TX_PACKETISER *txp,
1290                                         uint64_t cc_limit)
1291 {
1292     OSSL_ACKM_PROBE_INFO *probe_info
1293         = ossl_ackm_get0_probe_request(txp->args.ackm);
1294     uint32_t pn_space;
1295 
1296     /*
1297      * If ACKM has requested probe generation (e.g. due to PTO), we generate a
1298      * Probe-archetype packet. Actually, we determine archetype on a
1299      * per-datagram basis, so if any EL wants a probe, do a pass in which
1300      * we try and generate a probe (if needed) for all ELs.
1301      */
1302     if (probe_info->anti_deadlock_initial > 0
1303         || probe_info->anti_deadlock_handshake > 0)
1304         return TX_PACKETISER_ARCHETYPE_PROBE;
1305 
1306     for (pn_space = QUIC_PN_SPACE_INITIAL;
1307          pn_space < QUIC_PN_SPACE_NUM;
1308          ++pn_space)
1309         if (probe_info->pto[pn_space] > 0)
1310             return TX_PACKETISER_ARCHETYPE_PROBE;
1311 
1312     /*
1313      * If we are out of CC budget, we cannot send a normal packet,
1314      * but we can do an ACK-only packet (potentially, if we
1315      * want to send an ACK).
1316      */
1317     if (cc_limit == 0)
1318         return TX_PACKETISER_ARCHETYPE_ACK_ONLY;
1319 
1320     /* All other packets. */
1321     return TX_PACKETISER_ARCHETYPE_NORMAL;
1322 }
1323 
txp_should_try_staging(OSSL_QUIC_TX_PACKETISER * txp,uint32_t enc_level,uint32_t archetype,uint64_t cc_limit,uint32_t * conn_close_enc_level)1324 static int txp_should_try_staging(OSSL_QUIC_TX_PACKETISER *txp,
1325                                   uint32_t enc_level,
1326                                   uint32_t archetype,
1327                                   uint64_t cc_limit,
1328                                   uint32_t *conn_close_enc_level)
1329 {
1330     struct archetype_data a;
1331     uint32_t pn_space = ossl_quic_enc_level_to_pn_space(enc_level);
1332     QUIC_CFQ_ITEM *cfq_item;
1333 
1334     if (!ossl_qtx_is_enc_level_provisioned(txp->args.qtx, enc_level))
1335         return 0;
1336 
1337     if (!txp_get_archetype_data(enc_level, archetype, &a))
1338         return 0;
1339 
1340     if (!a.bypass_cc && cc_limit == 0)
1341         /* CC not allowing us to send. */
1342         return 0;
1343 
1344     /*
1345      * We can produce CONNECTION_CLOSE frames on any EL in principle, which
1346      * means we need to choose which EL we would prefer to use. After a
1347      * connection is fully established we have only one provisioned EL and this
1348      * is a non-issue. Where multiple ELs are provisioned, it is possible the
1349      * peer does not have the keys for the EL yet, which suggests in general it
1350      * is preferable to use the lowest EL which is still provisioned.
1351      *
1352      * However (RFC 9000 s. 10.2.3 & 12.5) we are also required to not send
1353      * application CONNECTION_CLOSE frames in non-1-RTT ELs, so as to not
1354      * potentially leak application data on a connection which has yet to be
1355      * authenticated. Thus when we have an application CONNECTION_CLOSE frame
1356      * queued and need to send it on a non-1-RTT EL, we have to convert it
1357      * into a transport CONNECTION_CLOSE frame which contains no application
1358      * data. Since this loses information, it suggests we should use the 1-RTT
1359      * EL to avoid this if possible, even if a lower EL is also available.
1360      *
1361      * At the same time, just because we have the 1-RTT EL provisioned locally
1362      * does not necessarily mean the peer does, for example if a handshake
1363      * CRYPTO frame has been lost. It is fairly important that CONNECTION_CLOSE
1364      * is signalled in a way we know our peer can decrypt, as we stop processing
1365      * connection retransmission logic for real after connection close and
1366      * simply 'blindly' retransmit the same CONNECTION_CLOSE frame.
1367      *
1368      * This is not a major concern for clients, since if a client has a 1-RTT EL
1369      * provisioned the server is guaranteed to also have a 1-RTT EL provisioned.
1370      *
1371      * TODO(QUIC SERVER): Revisit this when server support is added.
1372      */
1373     if (*conn_close_enc_level > enc_level
1374         && *conn_close_enc_level != QUIC_ENC_LEVEL_1RTT)
1375         *conn_close_enc_level = enc_level;
1376 
1377     /* Do we need to send a PTO probe? */
1378     if (a.allow_force_ack_eliciting) {
1379         OSSL_ACKM_PROBE_INFO *probe_info
1380             = ossl_ackm_get0_probe_request(txp->args.ackm);
1381 
1382         if ((enc_level == QUIC_ENC_LEVEL_INITIAL
1383              && probe_info->anti_deadlock_initial > 0)
1384             || (enc_level == QUIC_ENC_LEVEL_HANDSHAKE
1385                 && probe_info->anti_deadlock_handshake > 0)
1386             || probe_info->pto[pn_space] > 0)
1387             return 1;
1388     }
1389 
1390     /* Does the crypto stream for this EL want to produce anything? */
1391     if (a.allow_crypto && sstream_is_pending(txp->args.crypto[pn_space]))
1392         return 1;
1393 
1394     /* Does the ACKM for this PN space want to produce anything? */
1395     if (a.allow_ack && (ossl_ackm_is_ack_desired(txp->args.ackm, pn_space)
1396                         || (txp->want_ack & (1UL << pn_space)) != 0))
1397         return 1;
1398 
1399     /* Do we need to force emission of an ACK-eliciting packet? */
1400     if (a.allow_force_ack_eliciting
1401         && (txp->force_ack_eliciting & (1UL << pn_space)) != 0)
1402         return 1;
1403 
1404     /* Does the connection-level RXFC want to produce a frame? */
1405     if (a.allow_conn_fc && (txp->want_max_data
1406         || ossl_quic_rxfc_has_cwm_changed(txp->args.conn_rxfc, 0)))
1407         return 1;
1408 
1409     /* Do we want to produce a MAX_STREAMS frame? */
1410     if (a.allow_conn_fc
1411         && (txp->want_max_streams_bidi
1412             || ossl_quic_rxfc_has_cwm_changed(txp->args.max_streams_bidi_rxfc,
1413                                               0)
1414             || txp->want_max_streams_uni
1415             || ossl_quic_rxfc_has_cwm_changed(txp->args.max_streams_uni_rxfc,
1416                                               0)))
1417         return 1;
1418 
1419     /* Do we want to produce a HANDSHAKE_DONE frame? */
1420     if (a.allow_handshake_done && txp->want_handshake_done)
1421         return 1;
1422 
1423     /* Do we want to produce a CONNECTION_CLOSE frame? */
1424     if (a.allow_conn_close && txp->want_conn_close &&
1425         *conn_close_enc_level == enc_level)
1426         /*
1427          * This is a bit of a special case since CONNECTION_CLOSE can appear in
1428          * most packet types, and when we decide we want to send it this status
1429          * isn't tied to a specific EL. So if we want to send it, we send it
1430          * only on the lowest non-dropped EL.
1431          */
1432         return 1;
1433 
1434     /* Does the CFQ have any frames queued for this PN space? */
1435     if (enc_level != QUIC_ENC_LEVEL_0RTT)
1436         for (cfq_item = ossl_quic_cfq_get_priority_head(txp->args.cfq, pn_space);
1437              cfq_item != NULL;
1438              cfq_item = ossl_quic_cfq_item_get_priority_next(cfq_item, pn_space)) {
1439             uint64_t frame_type = ossl_quic_cfq_item_get_frame_type(cfq_item);
1440 
1441             switch (frame_type) {
1442             case OSSL_QUIC_FRAME_TYPE_NEW_CONN_ID:
1443                 if (a.allow_new_conn_id)
1444                     return 1;
1445                 break;
1446             case OSSL_QUIC_FRAME_TYPE_RETIRE_CONN_ID:
1447                 if (a.allow_retire_conn_id)
1448                     return 1;
1449                 break;
1450             case OSSL_QUIC_FRAME_TYPE_NEW_TOKEN:
1451                 if (a.allow_new_token)
1452                     return 1;
1453                 break;
1454             case OSSL_QUIC_FRAME_TYPE_PATH_RESPONSE:
1455                 if (a.allow_path_response)
1456                     return 1;
1457                 break;
1458             default:
1459                 if (a.allow_cfq_other)
1460                     return 1;
1461                 break;
1462             }
1463        }
1464 
1465     if (a.allow_stream_rel && txp->handshake_complete) {
1466         QUIC_STREAM_ITER it;
1467 
1468         /* If there are any active streams, 0/1-RTT wants to produce a packet.
1469          * Whether a stream is on the active list is required to be precise
1470          * (i.e., a stream is never on the active list if we cannot produce a
1471          * frame for it), and all stream-related frames are governed by
1472          * a.allow_stream_rel (i.e., if we can send one type of stream-related
1473          * frame, we can send any of them), so we don't need to inspect
1474          * individual streams on the active list, just confirm that the active
1475          * list is non-empty.
1476          */
1477         ossl_quic_stream_iter_init(&it, txp->args.qsm, 0);
1478         if (it.stream != NULL)
1479             return 1;
1480     }
1481 
1482     return 0;
1483 }
1484 
sstream_is_pending(QUIC_SSTREAM * sstream)1485 static int sstream_is_pending(QUIC_SSTREAM *sstream)
1486 {
1487     OSSL_QUIC_FRAME_STREAM hdr;
1488     OSSL_QTX_IOVEC iov[2];
1489     size_t num_iov = OSSL_NELEM(iov);
1490 
1491     return ossl_quic_sstream_get_stream_frame(sstream, 0, &hdr, iov, &num_iov);
1492 }
1493 
1494 /* Determine how many bytes we should use for the encoded PN. */
txp_determine_pn_len(OSSL_QUIC_TX_PACKETISER * txp)1495 static size_t txp_determine_pn_len(OSSL_QUIC_TX_PACKETISER *txp)
1496 {
1497     return 4; /* TODO(QUIC FUTURE) */
1498 }
1499 
1500 /* Determine plaintext packet payload length from payload length. */
txp_determine_ppl_from_pl(OSSL_QUIC_TX_PACKETISER * txp,size_t pl,uint32_t enc_level,size_t hdr_len,size_t * r)1501 static int txp_determine_ppl_from_pl(OSSL_QUIC_TX_PACKETISER *txp,
1502                                      size_t pl,
1503                                      uint32_t enc_level,
1504                                      size_t hdr_len,
1505                                      size_t *r)
1506 {
1507     if (pl < hdr_len)
1508         return 0;
1509 
1510     pl -= hdr_len;
1511 
1512     if (!ossl_qtx_calculate_plaintext_payload_len(txp->args.qtx, enc_level,
1513                                                   pl, &pl))
1514         return 0;
1515 
1516     *r = pl;
1517     return 1;
1518 }
1519 
txp_get_mdpl(OSSL_QUIC_TX_PACKETISER * txp)1520 static size_t txp_get_mdpl(OSSL_QUIC_TX_PACKETISER *txp)
1521 {
1522     return ossl_qtx_get_mdpl(txp->args.qtx);
1523 }
1524 
get_sstream_by_id(uint64_t stream_id,uint32_t pn_space,void * arg)1525 static QUIC_SSTREAM *get_sstream_by_id(uint64_t stream_id, uint32_t pn_space,
1526                                        void *arg)
1527 {
1528     OSSL_QUIC_TX_PACKETISER *txp = arg;
1529     QUIC_STREAM *s;
1530 
1531     if (stream_id == UINT64_MAX)
1532         return txp->args.crypto[pn_space];
1533 
1534     s = ossl_quic_stream_map_get_by_id(txp->args.qsm, stream_id);
1535     if (s == NULL)
1536         return NULL;
1537 
1538     return s->sstream;
1539 }
1540 
on_regen_notify(uint64_t frame_type,uint64_t stream_id,QUIC_TXPIM_PKT * pkt,void * arg)1541 static void on_regen_notify(uint64_t frame_type, uint64_t stream_id,
1542                             QUIC_TXPIM_PKT *pkt, void *arg)
1543 {
1544     OSSL_QUIC_TX_PACKETISER *txp = arg;
1545 
1546     switch (frame_type) {
1547         case OSSL_QUIC_FRAME_TYPE_HANDSHAKE_DONE:
1548             txp->want_handshake_done = 1;
1549             break;
1550         case OSSL_QUIC_FRAME_TYPE_MAX_DATA:
1551             txp->want_max_data = 1;
1552             break;
1553         case OSSL_QUIC_FRAME_TYPE_MAX_STREAMS_BIDI:
1554             txp->want_max_streams_bidi = 1;
1555             break;
1556         case OSSL_QUIC_FRAME_TYPE_MAX_STREAMS_UNI:
1557             txp->want_max_streams_uni = 1;
1558             break;
1559         case OSSL_QUIC_FRAME_TYPE_ACK_WITH_ECN:
1560             txp->want_ack |= (1UL << pkt->ackm_pkt.pkt_space);
1561             break;
1562         case OSSL_QUIC_FRAME_TYPE_MAX_STREAM_DATA:
1563             {
1564                 QUIC_STREAM *s
1565                     = ossl_quic_stream_map_get_by_id(txp->args.qsm, stream_id);
1566 
1567                 if (s == NULL)
1568                     return;
1569 
1570                 s->want_max_stream_data = 1;
1571                 ossl_quic_stream_map_update_state(txp->args.qsm, s);
1572             }
1573             break;
1574         case OSSL_QUIC_FRAME_TYPE_STOP_SENDING:
1575             {
1576                 QUIC_STREAM *s
1577                     = ossl_quic_stream_map_get_by_id(txp->args.qsm, stream_id);
1578 
1579                 if (s == NULL)
1580                     return;
1581 
1582                 ossl_quic_stream_map_schedule_stop_sending(txp->args.qsm, s);
1583             }
1584             break;
1585         case OSSL_QUIC_FRAME_TYPE_RESET_STREAM:
1586             {
1587                 QUIC_STREAM *s
1588                     = ossl_quic_stream_map_get_by_id(txp->args.qsm, stream_id);
1589 
1590                 if (s == NULL)
1591                     return;
1592 
1593                 s->want_reset_stream = 1;
1594                 ossl_quic_stream_map_update_state(txp->args.qsm, s);
1595             }
1596             break;
1597         default:
1598             assert(0);
1599             break;
1600     }
1601 }
1602 
txp_need_ping(OSSL_QUIC_TX_PACKETISER * txp,uint32_t pn_space,const struct archetype_data * adata)1603 static int txp_need_ping(OSSL_QUIC_TX_PACKETISER *txp,
1604                          uint32_t pn_space,
1605                          const struct archetype_data *adata)
1606 {
1607     return adata->allow_ping
1608         && (adata->require_ack_eliciting
1609             || (txp->force_ack_eliciting & (1UL << pn_space)) != 0);
1610 }
1611 
txp_pkt_init(struct txp_pkt * pkt,OSSL_QUIC_TX_PACKETISER * txp,uint32_t enc_level,uint32_t archetype,size_t running_total)1612 static int txp_pkt_init(struct txp_pkt *pkt, OSSL_QUIC_TX_PACKETISER *txp,
1613                         uint32_t enc_level, uint32_t archetype,
1614                         size_t running_total)
1615 {
1616     uint32_t pn_space = ossl_quic_enc_level_to_pn_space(enc_level);
1617 
1618     if (!txp_determine_geometry(txp, archetype, enc_level,
1619                                 running_total, &pkt->phdr, &pkt->geom))
1620         return 0;
1621 
1622     /*
1623      * Initialise TX helper. If we must be ACK eliciting, reserve 1 byte for
1624      * PING.
1625      */
1626     if (!tx_helper_init(&pkt->h, txp, enc_level,
1627                         pkt->geom.cmppl,
1628                         txp_need_ping(txp, pn_space, &pkt->geom.adata) ? 1 : 0))
1629         return 0;
1630 
1631     pkt->h_valid            = 1;
1632     pkt->tpkt               = NULL;
1633     pkt->stream_head        = NULL;
1634     pkt->force_pad          = 0;
1635     return 1;
1636 }
1637 
txp_pkt_cleanup(struct txp_pkt * pkt,OSSL_QUIC_TX_PACKETISER * txp)1638 static void txp_pkt_cleanup(struct txp_pkt *pkt, OSSL_QUIC_TX_PACKETISER *txp)
1639 {
1640     if (!pkt->h_valid)
1641         return;
1642 
1643     tx_helper_cleanup(&pkt->h);
1644     pkt->h_valid = 0;
1645 
1646     if (pkt->tpkt != NULL) {
1647         ossl_quic_txpim_pkt_release(txp->args.txpim, pkt->tpkt);
1648         pkt->tpkt = NULL;
1649     }
1650 }
1651 
txp_pkt_postgen_update_pkt_overhead(struct txp_pkt * pkt,OSSL_QUIC_TX_PACKETISER * txp)1652 static int txp_pkt_postgen_update_pkt_overhead(struct txp_pkt *pkt,
1653                                                OSSL_QUIC_TX_PACKETISER *txp)
1654 {
1655     /*
1656      * After we have staged and generated our packets, but before we commit
1657      * them, it is possible for the estimated packet overhead (packet header +
1658      * AEAD tag size) to shrink slightly because we generated a short packet
1659      * whose which can be represented in fewer bytes as a variable-length
1660      * integer than we were (pessimistically) budgeting for. We need to account
1661      * for this to ensure that we get our padding calculation exactly right.
1662      *
1663      * Update pkt_overhead to be accurate now that we know how much data is
1664      * going in a packet.
1665      */
1666     size_t hdr_len, ciphertext_len;
1667 
1668     if (pkt->h.enc_level == QUIC_ENC_LEVEL_INITIAL)
1669         /*
1670          * Don't update overheads for the INITIAL EL - we have not finished
1671          * appending padding to it and would potentially miscalculate the
1672          * correct padding if we now update the pkt_overhead field to switch to
1673          * e.g. a 1-byte length field in the packet header. Since we are padding
1674          * to QUIC_MIN_INITIAL_DGRAM_LEN which requires a 2-byte length field,
1675          * this is guaranteed to be moot anyway. See comment in
1676          * txp_determine_geometry for more information.
1677          */
1678         return 1;
1679 
1680     if (!ossl_qtx_calculate_ciphertext_payload_len(txp->args.qtx, pkt->h.enc_level,
1681                                                    pkt->h.bytes_appended,
1682                                                    &ciphertext_len))
1683         return 0;
1684 
1685     pkt->phdr.len = ciphertext_len;
1686 
1687     hdr_len = ossl_quic_wire_get_encoded_pkt_hdr_len(pkt->phdr.dst_conn_id.id_len,
1688                                                      &pkt->phdr);
1689 
1690     pkt->geom.pkt_overhead = hdr_len + ciphertext_len - pkt->h.bytes_appended;
1691     return 1;
1692 }
1693 
on_confirm_notify(uint64_t frame_type,uint64_t stream_id,QUIC_TXPIM_PKT * pkt,void * arg)1694 static void on_confirm_notify(uint64_t frame_type, uint64_t stream_id,
1695                               QUIC_TXPIM_PKT *pkt, void *arg)
1696 {
1697     OSSL_QUIC_TX_PACKETISER *txp = arg;
1698 
1699     switch (frame_type) {
1700         case OSSL_QUIC_FRAME_TYPE_STOP_SENDING:
1701             {
1702                 QUIC_STREAM *s
1703                     = ossl_quic_stream_map_get_by_id(txp->args.qsm, stream_id);
1704 
1705                 if (s == NULL)
1706                     return;
1707 
1708                 s->acked_stop_sending = 1;
1709                 ossl_quic_stream_map_update_state(txp->args.qsm, s);
1710             }
1711             break;
1712         case OSSL_QUIC_FRAME_TYPE_RESET_STREAM:
1713             {
1714                 QUIC_STREAM *s
1715                     = ossl_quic_stream_map_get_by_id(txp->args.qsm, stream_id);
1716 
1717                 if (s == NULL)
1718                     return;
1719 
1720                 /*
1721                  * We must already be in RESET_SENT or RESET_RECVD if we are
1722                  * here, so we don't need to check state here.
1723                  */
1724                 ossl_quic_stream_map_notify_reset_stream_acked(txp->args.qsm, s);
1725                 ossl_quic_stream_map_update_state(txp->args.qsm, s);
1726             }
1727             break;
1728         default:
1729             assert(0);
1730             break;
1731     }
1732 }
1733 
txp_pkt_append_padding(struct txp_pkt * pkt,OSSL_QUIC_TX_PACKETISER * txp,size_t num_bytes)1734 static int txp_pkt_append_padding(struct txp_pkt *pkt,
1735                                   OSSL_QUIC_TX_PACKETISER *txp, size_t num_bytes)
1736 {
1737     WPACKET *wpkt;
1738 
1739     if (num_bytes == 0)
1740         return 1;
1741 
1742     if (!ossl_assert(pkt->h_valid))
1743         return 0;
1744 
1745     if (!ossl_assert(pkt->tpkt != NULL))
1746         return 0;
1747 
1748     wpkt = tx_helper_begin(&pkt->h);
1749     if (wpkt == NULL)
1750         return 0;
1751 
1752     if (!ossl_quic_wire_encode_padding(wpkt, num_bytes)) {
1753         tx_helper_rollback(&pkt->h);
1754         return 0;
1755     }
1756 
1757     if (!tx_helper_commit(&pkt->h))
1758         return 0;
1759 
1760     pkt->tpkt->ackm_pkt.num_bytes      += num_bytes;
1761     /* Cannot be non-inflight if we have a PADDING frame */
1762     pkt->tpkt->ackm_pkt.is_inflight     = 1;
1763     return 1;
1764 }
1765 
on_sstream_updated(uint64_t stream_id,void * arg)1766 static void on_sstream_updated(uint64_t stream_id, void *arg)
1767 {
1768     OSSL_QUIC_TX_PACKETISER *txp = arg;
1769     QUIC_STREAM *s;
1770 
1771     s = ossl_quic_stream_map_get_by_id(txp->args.qsm, stream_id);
1772     if (s == NULL)
1773         return;
1774 
1775     ossl_quic_stream_map_update_state(txp->args.qsm, s);
1776 }
1777 
1778 /*
1779  * Returns 1 if we can send that many bytes in closing state, 0 otherwise.
1780  * Also maintains the bytes sent state if it returns a success.
1781  */
try_commit_conn_close(OSSL_QUIC_TX_PACKETISER * txp,size_t n)1782 static int try_commit_conn_close(OSSL_QUIC_TX_PACKETISER *txp, size_t n)
1783 {
1784     int res;
1785 
1786     /* We can always send the first connection close frame */
1787     if (txp->closing_bytes_recv == 0)
1788         return 1;
1789 
1790     /*
1791      * RFC 9000 s. 10.2.1 Closing Connection State:
1792      *      To avoid being used for an amplification attack, such
1793      *      endpoints MUST limit the cumulative size of packets it sends
1794      *      to three times the cumulative size of the packets that are
1795      *      received and attributed to the connection.
1796      * and:
1797      *      An endpoint in the closing state MUST either discard packets
1798      *      received from an unvalidated address or limit the cumulative
1799      *      size of packets it sends to an unvalidated address to three
1800      *      times the size of packets it receives from that address.
1801      */
1802     res = txp->closing_bytes_xmit + n <= txp->closing_bytes_recv * 3;
1803 
1804     /*
1805      * Attribute the bytes to the connection, if we are allowed to send them
1806      * and this isn't the first closing frame.
1807      */
1808     if (res && txp->closing_bytes_recv != 0)
1809         txp->closing_bytes_xmit += n;
1810     return res;
1811 }
1812 
ossl_quic_tx_packetiser_record_received_closing_bytes(OSSL_QUIC_TX_PACKETISER * txp,size_t n)1813 void ossl_quic_tx_packetiser_record_received_closing_bytes(
1814         OSSL_QUIC_TX_PACKETISER *txp, size_t n)
1815 {
1816     txp->closing_bytes_recv += n;
1817 }
1818 
txp_generate_pre_token(OSSL_QUIC_TX_PACKETISER * txp,struct txp_pkt * pkt,int chosen_for_conn_close,int * can_be_non_inflight)1819 static int txp_generate_pre_token(OSSL_QUIC_TX_PACKETISER *txp,
1820                                   struct txp_pkt *pkt,
1821                                   int chosen_for_conn_close,
1822                                   int *can_be_non_inflight)
1823 {
1824     const uint32_t enc_level = pkt->h.enc_level;
1825     const uint32_t pn_space = ossl_quic_enc_level_to_pn_space(enc_level);
1826     const struct archetype_data *a = &pkt->geom.adata;
1827     QUIC_TXPIM_PKT *tpkt = pkt->tpkt;
1828     struct tx_helper *h = &pkt->h;
1829     const OSSL_QUIC_FRAME_ACK *ack;
1830     OSSL_QUIC_FRAME_ACK ack2;
1831 
1832     tpkt->ackm_pkt.largest_acked = QUIC_PN_INVALID;
1833 
1834     /* ACK Frames (Regenerate) */
1835     if (a->allow_ack
1836         && tx_helper_get_space_left(h) >= MIN_FRAME_SIZE_ACK
1837         && (((txp->want_ack & (1UL << pn_space)) != 0)
1838             || ossl_ackm_is_ack_desired(txp->args.ackm, pn_space))
1839         && (ack = ossl_ackm_get_ack_frame(txp->args.ackm, pn_space)) != NULL) {
1840         WPACKET *wpkt = tx_helper_begin(h);
1841 
1842         if (wpkt == NULL)
1843             return 0;
1844 
1845         /* We do not currently support ECN */
1846         ack2 = *ack;
1847         ack2.ecn_present = 0;
1848 
1849         if (ossl_quic_wire_encode_frame_ack(wpkt,
1850                                             txp->args.ack_delay_exponent,
1851                                             &ack2)) {
1852             if (!tx_helper_commit(h))
1853                 return 0;
1854 
1855             tpkt->had_ack_frame = 1;
1856 
1857             if (ack->num_ack_ranges > 0)
1858                 tpkt->ackm_pkt.largest_acked = ack->ack_ranges[0].end;
1859 
1860             if (txp->ack_tx_cb != NULL)
1861                 txp->ack_tx_cb(&ack2, pn_space, txp->ack_tx_cb_arg);
1862         } else {
1863             tx_helper_rollback(h);
1864         }
1865     }
1866 
1867     /* CONNECTION_CLOSE Frames (Regenerate) */
1868     if (a->allow_conn_close && txp->want_conn_close && chosen_for_conn_close) {
1869         WPACKET *wpkt = tx_helper_begin(h);
1870         OSSL_QUIC_FRAME_CONN_CLOSE f, *pf = &txp->conn_close_frame;
1871         size_t l;
1872 
1873         if (wpkt == NULL)
1874             return 0;
1875 
1876         /*
1877          * Application CONNECTION_CLOSE frames may only be sent in the
1878          * Application PN space, as otherwise they may be sent before a
1879          * connection is authenticated and leak application data. Therefore, if
1880          * we need to send a CONNECTION_CLOSE frame in another PN space and were
1881          * given an application CONNECTION_CLOSE frame, convert it into a
1882          * transport CONNECTION_CLOSE frame, removing any sensitive application
1883          * data.
1884          *
1885          * RFC 9000 s. 10.2.3: "A CONNECTION_CLOSE of type 0x1d MUST be replaced
1886          * by a CONNECTION_CLOSE of type 0x1c when sending the frame in Initial
1887          * or Handshake packets. Otherwise, information about the application
1888          * state might be revealed. Endpoints MUST clear the value of the Reason
1889          * Phrase field and SHOULD use the APPLICATION_ERROR code when
1890          * converting to a CONNECTION_CLOSE of type 0x1c."
1891          */
1892         if (pn_space != QUIC_PN_SPACE_APP && pf->is_app) {
1893             pf = &f;
1894             pf->is_app      = 0;
1895             pf->frame_type  = 0;
1896             pf->error_code  = OSSL_QUIC_ERR_APPLICATION_ERROR;
1897             pf->reason      = NULL;
1898             pf->reason_len  = 0;
1899         }
1900 
1901         if (ossl_quic_wire_encode_frame_conn_close(wpkt, pf)
1902                 && WPACKET_get_total_written(wpkt, &l)
1903                 && try_commit_conn_close(txp, l)) {
1904             if (!tx_helper_commit(h))
1905                 return 0;
1906 
1907             tpkt->had_conn_close = 1;
1908             *can_be_non_inflight = 0;
1909         } else {
1910             tx_helper_rollback(h);
1911         }
1912     }
1913 
1914     return 1;
1915 }
1916 
try_len(size_t space_left,size_t orig_len,size_t base_hdr_len,size_t lenbytes,uint64_t maxn,size_t * hdr_len,size_t * payload_len)1917 static int try_len(size_t space_left, size_t orig_len,
1918                    size_t base_hdr_len, size_t lenbytes,
1919                    uint64_t maxn, size_t *hdr_len, size_t *payload_len)
1920 {
1921     size_t n;
1922     size_t maxn_ = maxn > SIZE_MAX ? SIZE_MAX : (size_t)maxn;
1923 
1924     *hdr_len = base_hdr_len + lenbytes;
1925 
1926     if (orig_len == 0 && space_left >= *hdr_len) {
1927         *payload_len = 0;
1928         return 1;
1929     }
1930 
1931     n = orig_len;
1932     if (n > maxn_)
1933         n = maxn_;
1934     if (n + *hdr_len > space_left)
1935         n = (space_left >= *hdr_len) ? space_left - *hdr_len : 0;
1936 
1937     *payload_len = n;
1938     return n > 0;
1939 }
1940 
determine_len(size_t space_left,size_t orig_len,size_t base_hdr_len,uint64_t * hlen,uint64_t * len)1941 static int determine_len(size_t space_left, size_t orig_len,
1942                          size_t base_hdr_len,
1943                          uint64_t *hlen, uint64_t *len)
1944 {
1945     int ok = 0;
1946     size_t chosen_payload_len = 0;
1947     size_t chosen_hdr_len     = 0;
1948     size_t payload_len[4], hdr_len[4];
1949     int i, valid[4] = {0};
1950 
1951     valid[0] = try_len(space_left, orig_len, base_hdr_len,
1952                        1, OSSL_QUIC_VLINT_1B_MAX,
1953                        &hdr_len[0], &payload_len[0]);
1954     valid[1] = try_len(space_left, orig_len, base_hdr_len,
1955                        2, OSSL_QUIC_VLINT_2B_MAX,
1956                        &hdr_len[1], &payload_len[1]);
1957     valid[2] = try_len(space_left, orig_len, base_hdr_len,
1958                        4, OSSL_QUIC_VLINT_4B_MAX,
1959                        &hdr_len[2], &payload_len[2]);
1960     valid[3] = try_len(space_left, orig_len, base_hdr_len,
1961                        8, OSSL_QUIC_VLINT_8B_MAX,
1962                        &hdr_len[3], &payload_len[3]);
1963 
1964    for (i = OSSL_NELEM(valid) - 1; i >= 0; --i)
1965         if (valid[i] && payload_len[i] >= chosen_payload_len) {
1966             chosen_payload_len = payload_len[i];
1967             chosen_hdr_len     = hdr_len[i];
1968             ok                 = 1;
1969         }
1970 
1971     *hlen = chosen_hdr_len;
1972     *len  = chosen_payload_len;
1973     return ok;
1974 }
1975 
1976 /*
1977  * Given a CRYPTO frame header with accurate chdr->len and a budget
1978  * (space_left), try to find the optimal value of chdr->len to fill as much of
1979  * the budget as possible. This is slightly hairy because larger values of
1980  * chdr->len cause larger encoded sizes of the length field of the frame, which
1981  * in turn mean less space available for payload data. We check all possible
1982  * encodings and choose the optimal encoding.
1983  */
determine_crypto_len(struct tx_helper * h,OSSL_QUIC_FRAME_CRYPTO * chdr,size_t space_left,uint64_t * hlen,uint64_t * len)1984 static int determine_crypto_len(struct tx_helper *h,
1985                                 OSSL_QUIC_FRAME_CRYPTO *chdr,
1986                                 size_t space_left,
1987                                 uint64_t *hlen,
1988                                 uint64_t *len)
1989 {
1990     size_t orig_len;
1991     size_t base_hdr_len; /* CRYPTO header length without length field */
1992 
1993     if (chdr->len > SIZE_MAX)
1994         return 0;
1995 
1996     orig_len = (size_t)chdr->len;
1997 
1998     chdr->len = 0;
1999     base_hdr_len = ossl_quic_wire_get_encoded_frame_len_crypto_hdr(chdr);
2000     chdr->len = orig_len;
2001     if (base_hdr_len == 0)
2002         return 0;
2003 
2004     --base_hdr_len;
2005 
2006     return determine_len(space_left, orig_len, base_hdr_len, hlen, len);
2007 }
2008 
determine_stream_len(struct tx_helper * h,OSSL_QUIC_FRAME_STREAM * shdr,size_t space_left,uint64_t * hlen,uint64_t * len)2009 static int determine_stream_len(struct tx_helper *h,
2010                                 OSSL_QUIC_FRAME_STREAM *shdr,
2011                                 size_t space_left,
2012                                 uint64_t *hlen,
2013                                 uint64_t *len)
2014 {
2015     size_t orig_len;
2016     size_t base_hdr_len; /* STREAM header length without length field */
2017 
2018     if (shdr->len > SIZE_MAX)
2019         return 0;
2020 
2021     orig_len = (size_t)shdr->len;
2022 
2023     shdr->len = 0;
2024     base_hdr_len = ossl_quic_wire_get_encoded_frame_len_stream_hdr(shdr);
2025     shdr->len = orig_len;
2026     if (base_hdr_len == 0)
2027         return 0;
2028 
2029     if (shdr->has_explicit_len)
2030         --base_hdr_len;
2031 
2032     return determine_len(space_left, orig_len, base_hdr_len, hlen, len);
2033 }
2034 
txp_generate_crypto_frames(OSSL_QUIC_TX_PACKETISER * txp,struct txp_pkt * pkt,int * have_ack_eliciting)2035 static int txp_generate_crypto_frames(OSSL_QUIC_TX_PACKETISER *txp,
2036                                       struct txp_pkt *pkt,
2037                                       int *have_ack_eliciting)
2038 {
2039     const uint32_t enc_level = pkt->h.enc_level;
2040     const uint32_t pn_space = ossl_quic_enc_level_to_pn_space(enc_level);
2041     QUIC_TXPIM_PKT *tpkt = pkt->tpkt;
2042     struct tx_helper *h = &pkt->h;
2043     size_t num_stream_iovec;
2044     OSSL_QUIC_FRAME_STREAM shdr = {0};
2045     OSSL_QUIC_FRAME_CRYPTO chdr = {0};
2046     OSSL_QTX_IOVEC iov[2];
2047     uint64_t hdr_bytes;
2048     WPACKET *wpkt;
2049     QUIC_TXPIM_CHUNK chunk = {0};
2050     size_t i, space_left;
2051 
2052     for (i = 0;; ++i) {
2053         space_left = tx_helper_get_space_left(h);
2054 
2055         if (space_left < MIN_FRAME_SIZE_CRYPTO)
2056             return 1; /* no point trying */
2057 
2058         /* Do we have any CRYPTO data waiting? */
2059         num_stream_iovec = OSSL_NELEM(iov);
2060         if (!ossl_quic_sstream_get_stream_frame(txp->args.crypto[pn_space],
2061                                                 i, &shdr, iov,
2062                                                 &num_stream_iovec))
2063             return 1; /* nothing to do */
2064 
2065         /* Convert STREAM frame header to CRYPTO frame header */
2066         chdr.offset = shdr.offset;
2067         chdr.len    = shdr.len;
2068 
2069         if (chdr.len == 0)
2070             return 1; /* nothing to do */
2071 
2072         /* Find best fit (header length, payload length) combination. */
2073         if (!determine_crypto_len(h, &chdr, space_left, &hdr_bytes,
2074                                   &chdr.len))
2075             return 1; /* can't fit anything */
2076 
2077         /*
2078          * Truncate IOVs to match our chosen length.
2079          *
2080          * The length cannot be more than SIZE_MAX because this length comes
2081          * from our send stream buffer.
2082          */
2083         ossl_quic_sstream_adjust_iov((size_t)chdr.len, iov, num_stream_iovec);
2084 
2085         /*
2086          * Ensure we have enough iovecs allocated (1 for the header, up to 2 for
2087          * the stream data.)
2088          */
2089         if (!txp_el_ensure_iovec(&txp->el[enc_level], h->num_iovec + 3))
2090             return 0; /* alloc error */
2091 
2092         /* Encode the header. */
2093         wpkt = tx_helper_begin(h);
2094         if (wpkt == NULL)
2095             return 0; /* alloc error */
2096 
2097         if (!ossl_quic_wire_encode_frame_crypto_hdr(wpkt, &chdr)) {
2098             tx_helper_rollback(h);
2099             return 1; /* can't fit */
2100         }
2101 
2102         if (!tx_helper_commit(h))
2103             return 0; /* alloc error */
2104 
2105         /* Add payload iovecs to the helper (infallible). */
2106         for (i = 0; i < num_stream_iovec; ++i)
2107             tx_helper_append_iovec(h, iov[i].buf, iov[i].buf_len);
2108 
2109         *have_ack_eliciting = 1;
2110         tx_helper_unrestrict(h); /* no longer need PING */
2111 
2112         /* Log chunk to TXPIM. */
2113         chunk.stream_id = UINT64_MAX; /* crypto stream */
2114         chunk.start     = chdr.offset;
2115         chunk.end       = chdr.offset + chdr.len - 1;
2116         chunk.has_fin   = 0; /* Crypto stream never ends */
2117         if (!ossl_quic_txpim_pkt_append_chunk(tpkt, &chunk))
2118             return 0; /* alloc error */
2119     }
2120 }
2121 
2122 struct chunk_info {
2123     OSSL_QUIC_FRAME_STREAM shdr;
2124     uint64_t orig_len;
2125     OSSL_QTX_IOVEC iov[2];
2126     size_t num_stream_iovec;
2127     int valid;
2128 };
2129 
txp_plan_stream_chunk(OSSL_QUIC_TX_PACKETISER * txp,struct tx_helper * h,QUIC_SSTREAM * sstream,QUIC_TXFC * stream_txfc,size_t skip,struct chunk_info * chunk,uint64_t consumed)2130 static int txp_plan_stream_chunk(OSSL_QUIC_TX_PACKETISER *txp,
2131                                  struct tx_helper *h,
2132                                  QUIC_SSTREAM *sstream,
2133                                  QUIC_TXFC *stream_txfc,
2134                                  size_t skip,
2135                                  struct chunk_info *chunk,
2136                                  uint64_t consumed)
2137 {
2138     uint64_t fc_credit, fc_swm, fc_limit;
2139 
2140     chunk->num_stream_iovec = OSSL_NELEM(chunk->iov);
2141     chunk->valid = ossl_quic_sstream_get_stream_frame(sstream, skip,
2142                                                       &chunk->shdr,
2143                                                       chunk->iov,
2144                                                       &chunk->num_stream_iovec);
2145     if (!chunk->valid)
2146         return 1;
2147 
2148     if (!ossl_assert(chunk->shdr.len > 0 || chunk->shdr.is_fin))
2149         /* Should only have 0-length chunk if FIN */
2150         return 0;
2151 
2152     chunk->orig_len = chunk->shdr.len;
2153 
2154     /* Clamp according to connection and stream-level TXFC. */
2155     fc_credit   = ossl_quic_txfc_get_credit(stream_txfc, consumed);
2156     fc_swm      = ossl_quic_txfc_get_swm(stream_txfc);
2157     fc_limit    = fc_swm + fc_credit;
2158 
2159     if (chunk->shdr.len > 0 && chunk->shdr.offset + chunk->shdr.len > fc_limit) {
2160         chunk->shdr.len = (fc_limit <= chunk->shdr.offset)
2161             ? 0 : fc_limit - chunk->shdr.offset;
2162         chunk->shdr.is_fin = 0;
2163     }
2164 
2165     if (chunk->shdr.len == 0 && !chunk->shdr.is_fin) {
2166         /*
2167          * Nothing to do due to TXFC. Since SSTREAM returns chunks in ascending
2168          * order of offset we don't need to check any later chunks, so stop
2169          * iterating here.
2170          */
2171         chunk->valid = 0;
2172         return 1;
2173     }
2174 
2175     return 1;
2176 }
2177 
2178 /*
2179  * Returns 0 on fatal error (e.g. allocation failure), 1 on success.
2180  * *packet_full is set to 1 if there is no longer enough room for another STREAM
2181  * frame.
2182  */
txp_generate_stream_frames(OSSL_QUIC_TX_PACKETISER * txp,struct txp_pkt * pkt,uint64_t id,QUIC_SSTREAM * sstream,QUIC_TXFC * stream_txfc,QUIC_STREAM * next_stream,int * have_ack_eliciting,int * packet_full,uint64_t * new_credit_consumed,uint64_t conn_consumed)2183 static int txp_generate_stream_frames(OSSL_QUIC_TX_PACKETISER *txp,
2184                                       struct txp_pkt *pkt,
2185                                       uint64_t id,
2186                                       QUIC_SSTREAM *sstream,
2187                                       QUIC_TXFC *stream_txfc,
2188                                       QUIC_STREAM *next_stream,
2189                                       int *have_ack_eliciting,
2190                                       int *packet_full,
2191                                       uint64_t *new_credit_consumed,
2192                                       uint64_t conn_consumed)
2193 {
2194     int rc = 0;
2195     struct chunk_info chunks[2] = {0};
2196     const uint32_t enc_level = pkt->h.enc_level;
2197     QUIC_TXPIM_PKT *tpkt = pkt->tpkt;
2198     struct tx_helper *h = &pkt->h;
2199     OSSL_QUIC_FRAME_STREAM *shdr;
2200     WPACKET *wpkt;
2201     QUIC_TXPIM_CHUNK chunk;
2202     size_t i, j, space_left;
2203     int can_fill_payload, use_explicit_len;
2204     int could_have_following_chunk;
2205     uint64_t orig_len;
2206     uint64_t hdr_len_implicit, payload_len_implicit;
2207     uint64_t hdr_len_explicit, payload_len_explicit;
2208     uint64_t fc_swm, fc_new_hwm;
2209 
2210     fc_swm      = ossl_quic_txfc_get_swm(stream_txfc);
2211     fc_new_hwm  = fc_swm;
2212 
2213     /*
2214      * Load the first two chunks if any offered by the send stream. We retrieve
2215      * the next chunk in advance so we can determine if we need to send any more
2216      * chunks from the same stream after this one, which is needed when
2217      * determining when we can use an implicit length in a STREAM frame.
2218      */
2219     for (i = 0; i < 2; ++i) {
2220         if (!txp_plan_stream_chunk(txp, h, sstream, stream_txfc, i, &chunks[i],
2221                                    conn_consumed))
2222             goto err;
2223 
2224         if (i == 0 && !chunks[i].valid) {
2225             /* No chunks, nothing to do. */
2226             rc = 1;
2227             goto err;
2228         }
2229     }
2230 
2231     for (i = 0;; ++i) {
2232         space_left = tx_helper_get_space_left(h);
2233 
2234         if (!chunks[i % 2].valid) {
2235             /* Out of chunks; we're done. */
2236             rc = 1;
2237             goto err;
2238         }
2239 
2240         if (space_left < MIN_FRAME_SIZE_STREAM) {
2241             *packet_full = 1;
2242             rc = 1;
2243             goto err;
2244         }
2245 
2246         if (!ossl_assert(!h->done_implicit))
2247             /*
2248              * Logic below should have ensured we didn't append an
2249              * implicit-length unless we filled the packet or didn't have
2250              * another stream to handle, so this should not be possible.
2251              */
2252             goto err;
2253 
2254         shdr = &chunks[i % 2].shdr;
2255         orig_len = chunks[i % 2].orig_len;
2256         if (i > 0)
2257             /* Load next chunk for lookahead. */
2258             if (!txp_plan_stream_chunk(txp, h, sstream, stream_txfc, i + 1,
2259                                        &chunks[(i + 1) % 2], conn_consumed))
2260                 goto err;
2261 
2262         /*
2263          * Find best fit (header length, payload length) combination for if we
2264          * use an implicit length.
2265          */
2266         shdr->has_explicit_len = 0;
2267         hdr_len_implicit = payload_len_implicit = 0;
2268         if (!determine_stream_len(h, shdr, space_left,
2269                                   &hdr_len_implicit, &payload_len_implicit)) {
2270             *packet_full = 1;
2271             rc = 1;
2272             goto err; /* can't fit anything */
2273         }
2274 
2275         /*
2276          * If there is a next stream, we don't use the implicit length so we can
2277          * add more STREAM frames after this one, unless there is enough data
2278          * for this STREAM frame to fill the packet.
2279          */
2280         can_fill_payload = (hdr_len_implicit + payload_len_implicit
2281                             >= space_left);
2282 
2283         /*
2284          * Is there is a stream after this one, or another chunk pending
2285          * transmission in this stream?
2286          */
2287         could_have_following_chunk
2288             = (next_stream != NULL || chunks[(i + 1) % 2].valid);
2289 
2290         /* Choose between explicit or implicit length representations. */
2291         use_explicit_len = !((can_fill_payload || !could_have_following_chunk)
2292                              && !pkt->force_pad);
2293 
2294         if (use_explicit_len) {
2295             /*
2296              * Find best fit (header length, payload length) combination for if
2297              * we use an explicit length.
2298              */
2299             shdr->has_explicit_len = 1;
2300             hdr_len_explicit = payload_len_explicit = 0;
2301             if (!determine_stream_len(h, shdr, space_left,
2302                                       &hdr_len_explicit, &payload_len_explicit)) {
2303                 *packet_full = 1;
2304                 rc = 1;
2305                 goto err; /* can't fit anything */
2306             }
2307 
2308             shdr->len = payload_len_explicit;
2309         } else {
2310             *packet_full = 1;
2311             shdr->has_explicit_len = 0;
2312             shdr->len = payload_len_implicit;
2313         }
2314 
2315         /* If this is a FIN, don't keep filling the packet with more FINs. */
2316         if (shdr->is_fin)
2317             chunks[(i + 1) % 2].valid = 0;
2318 
2319         /*
2320          * We are now committed to our length (shdr->len can't change).
2321          * If we truncated the chunk, clear the FIN bit.
2322          */
2323         if (shdr->len < orig_len)
2324             shdr->is_fin = 0;
2325 
2326         /* Truncate IOVs to match our chosen length. */
2327         ossl_quic_sstream_adjust_iov((size_t)shdr->len, chunks[i % 2].iov,
2328                                      chunks[i % 2].num_stream_iovec);
2329 
2330         /*
2331          * Ensure we have enough iovecs allocated (1 for the header, up to 2 for
2332          * the stream data.)
2333          */
2334         if (!txp_el_ensure_iovec(&txp->el[enc_level], h->num_iovec + 3))
2335             goto err; /* alloc error */
2336 
2337         /* Encode the header. */
2338         wpkt = tx_helper_begin(h);
2339         if (wpkt == NULL)
2340             goto err; /* alloc error */
2341 
2342         shdr->stream_id = id;
2343         if (!ossl_assert(ossl_quic_wire_encode_frame_stream_hdr(wpkt, shdr))) {
2344             /* (Should not be possible.) */
2345             tx_helper_rollback(h);
2346             *packet_full = 1;
2347             rc = 1;
2348             goto err; /* can't fit */
2349         }
2350 
2351         if (!tx_helper_commit(h))
2352             goto err; /* alloc error */
2353 
2354         /* Add payload iovecs to the helper (infallible). */
2355         for (j = 0; j < chunks[i % 2].num_stream_iovec; ++j)
2356             tx_helper_append_iovec(h, chunks[i % 2].iov[j].buf,
2357                                    chunks[i % 2].iov[j].buf_len);
2358 
2359         *have_ack_eliciting = 1;
2360         tx_helper_unrestrict(h); /* no longer need PING */
2361         if (!shdr->has_explicit_len)
2362             h->done_implicit = 1;
2363 
2364         /* Log new TXFC credit which was consumed. */
2365         if (shdr->len > 0 && shdr->offset + shdr->len > fc_new_hwm)
2366             fc_new_hwm = shdr->offset + shdr->len;
2367 
2368         /* Log chunk to TXPIM. */
2369         chunk.stream_id         = shdr->stream_id;
2370         chunk.start             = shdr->offset;
2371         chunk.end               = shdr->offset + shdr->len - 1;
2372         chunk.has_fin           = shdr->is_fin;
2373         chunk.has_stop_sending  = 0;
2374         chunk.has_reset_stream  = 0;
2375         if (!ossl_quic_txpim_pkt_append_chunk(tpkt, &chunk))
2376             goto err; /* alloc error */
2377 
2378         if (shdr->len < orig_len) {
2379             /*
2380              * If we did not serialize all of this chunk we definitely do not
2381              * want to try the next chunk
2382              */
2383             rc = 1;
2384             goto err;
2385         }
2386     }
2387 
2388 err:
2389     *new_credit_consumed = fc_new_hwm - fc_swm;
2390     return rc;
2391 }
2392 
txp_enlink_tmp(QUIC_STREAM ** tmp_head,QUIC_STREAM * stream)2393 static void txp_enlink_tmp(QUIC_STREAM **tmp_head, QUIC_STREAM *stream)
2394 {
2395     stream->txp_next = *tmp_head;
2396     *tmp_head = stream;
2397 }
2398 
txp_generate_stream_related(OSSL_QUIC_TX_PACKETISER * txp,struct txp_pkt * pkt,int * have_ack_eliciting,QUIC_STREAM ** tmp_head)2399 static int txp_generate_stream_related(OSSL_QUIC_TX_PACKETISER *txp,
2400                                        struct txp_pkt *pkt,
2401                                        int *have_ack_eliciting,
2402                                        QUIC_STREAM **tmp_head)
2403 {
2404     QUIC_STREAM_ITER it;
2405     WPACKET *wpkt;
2406     uint64_t cwm;
2407     QUIC_STREAM *stream, *snext;
2408     struct tx_helper *h = &pkt->h;
2409     uint64_t conn_consumed = 0;
2410 
2411     for (ossl_quic_stream_iter_init(&it, txp->args.qsm, 1);
2412          it.stream != NULL;) {
2413 
2414         stream = it.stream;
2415         ossl_quic_stream_iter_next(&it);
2416         snext = it.stream;
2417 
2418         stream->txp_sent_fc                  = 0;
2419         stream->txp_sent_stop_sending        = 0;
2420         stream->txp_sent_reset_stream        = 0;
2421         stream->txp_blocked                  = 0;
2422         stream->txp_txfc_new_credit_consumed = 0;
2423 
2424         /* Stream Abort Frames (STOP_SENDING, RESET_STREAM) */
2425         if (stream->want_stop_sending) {
2426             OSSL_QUIC_FRAME_STOP_SENDING f;
2427 
2428             wpkt = tx_helper_begin(h);
2429             if (wpkt == NULL)
2430                 return 0; /* alloc error */
2431 
2432             f.stream_id         = stream->id;
2433             f.app_error_code    = stream->stop_sending_aec;
2434             if (!ossl_quic_wire_encode_frame_stop_sending(wpkt, &f)) {
2435                 tx_helper_rollback(h); /* can't fit */
2436                 txp_enlink_tmp(tmp_head, stream);
2437                 break;
2438             }
2439 
2440             if (!tx_helper_commit(h))
2441                 return 0; /* alloc error */
2442 
2443             *have_ack_eliciting = 1;
2444             tx_helper_unrestrict(h); /* no longer need PING */
2445             stream->txp_sent_stop_sending = 1;
2446         }
2447 
2448         if (stream->want_reset_stream) {
2449             OSSL_QUIC_FRAME_RESET_STREAM f;
2450 
2451             if (!ossl_assert(stream->send_state == QUIC_SSTREAM_STATE_RESET_SENT))
2452                 return 0;
2453 
2454             wpkt = tx_helper_begin(h);
2455             if (wpkt == NULL)
2456                 return 0; /* alloc error */
2457 
2458             f.stream_id         = stream->id;
2459             f.app_error_code    = stream->reset_stream_aec;
2460             if (!ossl_quic_stream_send_get_final_size(stream, &f.final_size))
2461                 return 0; /* should not be possible */
2462 
2463             if (!ossl_quic_wire_encode_frame_reset_stream(wpkt, &f)) {
2464                 tx_helper_rollback(h); /* can't fit */
2465                 txp_enlink_tmp(tmp_head, stream);
2466                 break;
2467             }
2468 
2469             if (!tx_helper_commit(h))
2470                 return 0; /* alloc error */
2471 
2472             *have_ack_eliciting = 1;
2473             tx_helper_unrestrict(h); /* no longer need PING */
2474             stream->txp_sent_reset_stream = 1;
2475 
2476             /*
2477              * The final size of the stream as indicated by RESET_STREAM is used
2478              * to ensure a consistent view of flow control state by both
2479              * parties; if we happen to send a RESET_STREAM that consumes more
2480              * flow control credit, make sure we account for that.
2481              */
2482             if (!ossl_assert(f.final_size <= ossl_quic_txfc_get_swm(&stream->txfc)))
2483                 return 0;
2484 
2485             stream->txp_txfc_new_credit_consumed
2486                 = f.final_size - ossl_quic_txfc_get_swm(&stream->txfc);
2487         }
2488 
2489         /*
2490          * Stream Flow Control Frames (MAX_STREAM_DATA)
2491          *
2492          * RFC 9000 s. 13.3: "An endpoint SHOULD stop sending MAX_STREAM_DATA
2493          * frames when the receiving part of the stream enters a "Size Known" or
2494          * "Reset Recvd" state." -- In practice, RECV is the only state
2495          * in which it makes sense to generate more MAX_STREAM_DATA frames.
2496          */
2497         if (stream->recv_state == QUIC_RSTREAM_STATE_RECV
2498             && (stream->want_max_stream_data
2499                 || ossl_quic_rxfc_has_cwm_changed(&stream->rxfc, 0))) {
2500 
2501             wpkt = tx_helper_begin(h);
2502             if (wpkt == NULL)
2503                 return 0; /* alloc error */
2504 
2505             cwm = ossl_quic_rxfc_get_cwm(&stream->rxfc);
2506 
2507             if (!ossl_quic_wire_encode_frame_max_stream_data(wpkt, stream->id,
2508                                                              cwm)) {
2509                 tx_helper_rollback(h); /* can't fit */
2510                 txp_enlink_tmp(tmp_head, stream);
2511                 break;
2512             }
2513 
2514             if (!tx_helper_commit(h))
2515                 return 0; /* alloc error */
2516 
2517             *have_ack_eliciting = 1;
2518             tx_helper_unrestrict(h); /* no longer need PING */
2519             stream->txp_sent_fc = 1;
2520         }
2521 
2522         /*
2523          * Stream Data Frames (STREAM)
2524          *
2525          * RFC 9000 s. 3.3: A sender MUST NOT send a STREAM [...] frame for a
2526          * stream in the "Reset Sent" state [or any terminal state]. We don't
2527          * send any more STREAM frames if we are sending, have sent, or are
2528          * planning to send, RESET_STREAM. The other terminal state is Data
2529          * Recvd, but txp_generate_stream_frames() is guaranteed to generate
2530          * nothing in this case.
2531          */
2532         if (ossl_quic_stream_has_send_buffer(stream)
2533             && !ossl_quic_stream_send_is_reset(stream)) {
2534             int packet_full = 0;
2535 
2536             if (!ossl_assert(!stream->want_reset_stream))
2537                 return 0;
2538 
2539             if (!txp_generate_stream_frames(txp, pkt,
2540                                             stream->id, stream->sstream,
2541                                             &stream->txfc,
2542                                             snext,
2543                                             have_ack_eliciting,
2544                                             &packet_full,
2545                                             &stream->txp_txfc_new_credit_consumed,
2546                                             conn_consumed)) {
2547                 /* Fatal error (allocation, etc.) */
2548                 txp_enlink_tmp(tmp_head, stream);
2549                 return 0;
2550             }
2551             conn_consumed += stream->txp_txfc_new_credit_consumed;
2552 
2553             if (packet_full) {
2554                 txp_enlink_tmp(tmp_head, stream);
2555                 break;
2556             }
2557         }
2558 
2559         txp_enlink_tmp(tmp_head, stream);
2560     }
2561 
2562     return 1;
2563 }
2564 
txp_generate_for_el(OSSL_QUIC_TX_PACKETISER * txp,struct txp_pkt * pkt,int chosen_for_conn_close)2565 static int txp_generate_for_el(OSSL_QUIC_TX_PACKETISER *txp,
2566                                struct txp_pkt *pkt,
2567                                int chosen_for_conn_close)
2568 {
2569     int rc = TXP_ERR_SUCCESS;
2570     const uint32_t enc_level = pkt->h.enc_level;
2571     const uint32_t pn_space = ossl_quic_enc_level_to_pn_space(enc_level);
2572     int have_ack_eliciting = 0, done_pre_token = 0;
2573     const struct archetype_data a = pkt->geom.adata;
2574     /*
2575      * Cleared if we encode any non-ACK-eliciting frame type which rules out the
2576      * packet being a non-inflight frame. This means any non-ACK ACK-eliciting
2577      * frame, even PADDING frames. ACK eliciting frames always cause a packet to
2578      * become ineligible for non-inflight treatment so it is not necessary to
2579      * clear this in cases where have_ack_eliciting is set, as it is ignored in
2580      * that case.
2581      */
2582     int can_be_non_inflight = 1;
2583     QUIC_CFQ_ITEM *cfq_item;
2584     QUIC_TXPIM_PKT *tpkt = NULL;
2585     struct tx_helper *h = &pkt->h;
2586 
2587     /* Maximum PN reached? */
2588     if (!ossl_quic_pn_valid(txp->next_pn[pn_space]))
2589         goto fatal_err;
2590 
2591     if (!ossl_assert(pkt->tpkt == NULL))
2592         goto fatal_err;
2593 
2594     if ((pkt->tpkt = tpkt = ossl_quic_txpim_pkt_alloc(txp->args.txpim)) == NULL)
2595         goto fatal_err;
2596 
2597     /*
2598      * Frame Serialization
2599      * ===================
2600      *
2601      * We now serialize frames into the packet in descending order of priority.
2602      */
2603 
2604     /* HANDSHAKE_DONE (Regenerate) */
2605     if (a.allow_handshake_done && txp->want_handshake_done
2606         && tx_helper_get_space_left(h) >= MIN_FRAME_SIZE_HANDSHAKE_DONE) {
2607         WPACKET *wpkt = tx_helper_begin(h);
2608 
2609         if (wpkt == NULL)
2610             goto fatal_err;
2611 
2612         if (ossl_quic_wire_encode_frame_handshake_done(wpkt)) {
2613             tpkt->had_handshake_done_frame = 1;
2614             have_ack_eliciting             = 1;
2615 
2616             if (!tx_helper_commit(h))
2617                 goto fatal_err;
2618 
2619             tx_helper_unrestrict(h); /* no longer need PING */
2620         } else {
2621             tx_helper_rollback(h);
2622         }
2623     }
2624 
2625     /* MAX_DATA (Regenerate) */
2626     if (a.allow_conn_fc
2627         && (txp->want_max_data
2628             || ossl_quic_rxfc_has_cwm_changed(txp->args.conn_rxfc, 0))
2629         && tx_helper_get_space_left(h) >= MIN_FRAME_SIZE_MAX_DATA) {
2630         WPACKET *wpkt = tx_helper_begin(h);
2631         uint64_t cwm = ossl_quic_rxfc_get_cwm(txp->args.conn_rxfc);
2632 
2633         if (wpkt == NULL)
2634             goto fatal_err;
2635 
2636         if (ossl_quic_wire_encode_frame_max_data(wpkt, cwm)) {
2637             tpkt->had_max_data_frame = 1;
2638             have_ack_eliciting       = 1;
2639 
2640             if (!tx_helper_commit(h))
2641                 goto fatal_err;
2642 
2643             tx_helper_unrestrict(h); /* no longer need PING */
2644         } else {
2645             tx_helper_rollback(h);
2646         }
2647     }
2648 
2649     /* MAX_STREAMS_BIDI (Regenerate) */
2650     if (a.allow_conn_fc
2651         && (txp->want_max_streams_bidi
2652             || ossl_quic_rxfc_has_cwm_changed(txp->args.max_streams_bidi_rxfc, 0))
2653         && tx_helper_get_space_left(h) >= MIN_FRAME_SIZE_MAX_STREAMS_BIDI) {
2654         WPACKET *wpkt = tx_helper_begin(h);
2655         uint64_t max_streams
2656             = ossl_quic_rxfc_get_cwm(txp->args.max_streams_bidi_rxfc);
2657 
2658         if (wpkt == NULL)
2659             goto fatal_err;
2660 
2661         if (ossl_quic_wire_encode_frame_max_streams(wpkt, /*is_uni=*/0,
2662                                                     max_streams)) {
2663             tpkt->had_max_streams_bidi_frame = 1;
2664             have_ack_eliciting               = 1;
2665 
2666             if (!tx_helper_commit(h))
2667                 goto fatal_err;
2668 
2669             tx_helper_unrestrict(h); /* no longer need PING */
2670         } else {
2671             tx_helper_rollback(h);
2672         }
2673     }
2674 
2675     /* MAX_STREAMS_UNI (Regenerate) */
2676     if (a.allow_conn_fc
2677         && (txp->want_max_streams_uni
2678             || ossl_quic_rxfc_has_cwm_changed(txp->args.max_streams_uni_rxfc, 0))
2679         && tx_helper_get_space_left(h) >= MIN_FRAME_SIZE_MAX_STREAMS_UNI) {
2680         WPACKET *wpkt = tx_helper_begin(h);
2681         uint64_t max_streams
2682             = ossl_quic_rxfc_get_cwm(txp->args.max_streams_uni_rxfc);
2683 
2684         if (wpkt == NULL)
2685             goto fatal_err;
2686 
2687         if (ossl_quic_wire_encode_frame_max_streams(wpkt, /*is_uni=*/1,
2688                                                     max_streams)) {
2689             tpkt->had_max_streams_uni_frame = 1;
2690             have_ack_eliciting              = 1;
2691 
2692             if (!tx_helper_commit(h))
2693                 goto fatal_err;
2694 
2695             tx_helper_unrestrict(h); /* no longer need PING */
2696         } else {
2697             tx_helper_rollback(h);
2698         }
2699     }
2700 
2701     /* GCR Frames */
2702     for (cfq_item = ossl_quic_cfq_get_priority_head(txp->args.cfq, pn_space);
2703          cfq_item != NULL;
2704          cfq_item = ossl_quic_cfq_item_get_priority_next(cfq_item, pn_space)) {
2705         uint64_t frame_type = ossl_quic_cfq_item_get_frame_type(cfq_item);
2706         const unsigned char *encoded = ossl_quic_cfq_item_get_encoded(cfq_item);
2707         size_t encoded_len = ossl_quic_cfq_item_get_encoded_len(cfq_item);
2708 
2709         switch (frame_type) {
2710             case OSSL_QUIC_FRAME_TYPE_NEW_CONN_ID:
2711                 if (!a.allow_new_conn_id)
2712                     continue;
2713                 break;
2714             case OSSL_QUIC_FRAME_TYPE_RETIRE_CONN_ID:
2715                 if (!a.allow_retire_conn_id)
2716                     continue;
2717                 break;
2718             case OSSL_QUIC_FRAME_TYPE_NEW_TOKEN:
2719                 if (!a.allow_new_token)
2720                     continue;
2721 
2722                 /*
2723                  * NEW_TOKEN frames are handled via GCR, but some
2724                  * Regenerate-strategy frames should come before them (namely
2725                  * ACK, CONNECTION_CLOSE, PATH_CHALLENGE and PATH_RESPONSE). If
2726                  * we find a NEW_TOKEN frame, do these now. If there are no
2727                  * NEW_TOKEN frames in the GCR queue we will handle these below.
2728                  */
2729                 if (!done_pre_token)
2730                     if (txp_generate_pre_token(txp, pkt,
2731                                                chosen_for_conn_close,
2732                                                &can_be_non_inflight))
2733                         done_pre_token = 1;
2734 
2735                 break;
2736             case OSSL_QUIC_FRAME_TYPE_PATH_RESPONSE:
2737                 if (!a.allow_path_response)
2738                     continue;
2739 
2740                 /*
2741                  * RFC 9000 s. 8.2.2: An endpoint MUST expand datagrams that
2742                  * contain a PATH_RESPONSE frame to at least the smallest
2743                  * allowed maximum datagram size of 1200 bytes.
2744                  */
2745                 pkt->force_pad = 1;
2746                 break;
2747             default:
2748                 if (!a.allow_cfq_other)
2749                     continue;
2750                 break;
2751         }
2752 
2753         /*
2754          * If the frame is too big, don't try to schedule any more GCR frames in
2755          * this packet rather than sending subsequent ones out of order.
2756          */
2757         if (encoded_len > tx_helper_get_space_left(h))
2758             break;
2759 
2760         if (!tx_helper_append_iovec(h, encoded, encoded_len))
2761             goto fatal_err;
2762 
2763         ossl_quic_txpim_pkt_add_cfq_item(tpkt, cfq_item);
2764 
2765         if (ossl_quic_frame_type_is_ack_eliciting(frame_type)) {
2766             have_ack_eliciting = 1;
2767             tx_helper_unrestrict(h); /* no longer need PING */
2768         }
2769     }
2770 
2771     /*
2772      * If we didn't generate ACK, CONNECTION_CLOSE, PATH_CHALLENGE or
2773      * PATH_RESPONSE (as desired) before, do so now.
2774      */
2775     if (!done_pre_token)
2776         if (txp_generate_pre_token(txp, pkt,
2777                                    chosen_for_conn_close,
2778                                    &can_be_non_inflight))
2779             done_pre_token = 1;
2780 
2781     /* CRYPTO Frames */
2782     if (a.allow_crypto)
2783         if (!txp_generate_crypto_frames(txp, pkt, &have_ack_eliciting))
2784             goto fatal_err;
2785 
2786     /* Stream-specific frames */
2787     if (a.allow_stream_rel && txp->handshake_complete)
2788         if (!txp_generate_stream_related(txp, pkt,
2789                                          &have_ack_eliciting,
2790                                          &pkt->stream_head))
2791             goto fatal_err;
2792 
2793     /* PING */
2794     tx_helper_unrestrict(h);
2795 
2796     if (!have_ack_eliciting && txp_need_ping(txp, pn_space, &a)) {
2797         WPACKET *wpkt;
2798 
2799         assert(h->reserve > 0);
2800         wpkt = tx_helper_begin(h);
2801         if (wpkt == NULL)
2802             goto fatal_err;
2803 
2804         if (!ossl_quic_wire_encode_frame_ping(wpkt)
2805             || !tx_helper_commit(h))
2806             /*
2807              * We treat a request to be ACK-eliciting as a requirement, so this
2808              * is an error.
2809              */
2810             goto fatal_err;
2811 
2812         have_ack_eliciting = 1;
2813     }
2814 
2815     /* PADDING is added by ossl_quic_tx_packetiser_generate(). */
2816 
2817     /*
2818      * ACKM Data
2819      * =========
2820      */
2821     if (have_ack_eliciting)
2822         can_be_non_inflight = 0;
2823 
2824     /* ACKM Data */
2825     tpkt->ackm_pkt.num_bytes        = h->bytes_appended + pkt->geom.pkt_overhead;
2826     tpkt->ackm_pkt.pkt_num          = txp->next_pn[pn_space];
2827     /* largest_acked is set in txp_generate_pre_token */
2828     tpkt->ackm_pkt.pkt_space        = pn_space;
2829     tpkt->ackm_pkt.is_inflight      = !can_be_non_inflight;
2830     tpkt->ackm_pkt.is_ack_eliciting = have_ack_eliciting;
2831     tpkt->ackm_pkt.is_pto_probe     = 0;
2832     tpkt->ackm_pkt.is_mtu_probe     = 0;
2833     tpkt->ackm_pkt.time             = txp->args.now(txp->args.now_arg);
2834     tpkt->pkt_type                  = pkt->phdr.type;
2835 
2836     /* Done. */
2837     return rc;
2838 
2839 fatal_err:
2840     /*
2841      * Handler for fatal errors, i.e. errors causing us to abort the entire
2842      * packet rather than just one frame. Examples of such errors include
2843      * allocation errors.
2844      */
2845     if (tpkt != NULL) {
2846         ossl_quic_txpim_pkt_release(txp->args.txpim, tpkt);
2847         pkt->tpkt = NULL;
2848     }
2849     return TXP_ERR_INTERNAL;
2850 }
2851 
2852 /*
2853  * Commits and queues a packet for transmission. There is no backing out after
2854  * this.
2855  *
2856  * This:
2857  *
2858  *   - Sends the packet to the QTX for encryption and transmission;
2859  *
2860  *   - Records the packet as having been transmitted in FIFM. ACKM is informed,
2861  *     etc. and the TXPIM record is filed.
2862  *
2863  *   - Informs various subsystems of frames that were sent and clears frame
2864  *     wanted flags so that we do not generate the same frames again.
2865  *
2866  * Assumptions:
2867  *
2868  *   - pkt is a txp_pkt for the correct EL;
2869  *
2870  *   - pkt->tpkt is valid;
2871  *
2872  *   - pkt->tpkt->ackm_pkt has been fully filled in;
2873  *
2874  *   - Stream chunk records have been appended to pkt->tpkt for STREAM and
2875  *     CRYPTO frames, but not for RESET_STREAM or STOP_SENDING frames;
2876  *
2877  *   - The chosen stream list for the packet can be fully walked from
2878  *     pkt->stream_head using stream->txp_next;
2879  *
2880  *   - pkt->has_ack_eliciting is set correctly.
2881  *
2882  */
txp_pkt_commit(OSSL_QUIC_TX_PACKETISER * txp,struct txp_pkt * pkt,uint32_t archetype,int * txpim_pkt_reffed)2883 static int txp_pkt_commit(OSSL_QUIC_TX_PACKETISER *txp,
2884                           struct txp_pkt *pkt,
2885                           uint32_t archetype,
2886                           int *txpim_pkt_reffed)
2887 {
2888     int rc = 1;
2889     uint32_t enc_level = pkt->h.enc_level;
2890     uint32_t pn_space = ossl_quic_enc_level_to_pn_space(enc_level);
2891     QUIC_TXPIM_PKT *tpkt = pkt->tpkt;
2892     QUIC_STREAM *stream;
2893     OSSL_QTX_PKT txpkt;
2894     struct archetype_data a;
2895 
2896     *txpim_pkt_reffed = 0;
2897 
2898     /* Cannot send a packet with an empty payload. */
2899     if (pkt->h.bytes_appended == 0)
2900         return 0;
2901 
2902     if (!txp_get_archetype_data(enc_level, archetype, &a))
2903         return 0;
2904 
2905     /* Packet Information for QTX */
2906     txpkt.hdr       = &pkt->phdr;
2907     txpkt.iovec     = txp->el[enc_level].iovec;
2908     txpkt.num_iovec = pkt->h.num_iovec;
2909     txpkt.local     = NULL;
2910     txpkt.peer      = BIO_ADDR_family(&txp->args.peer) == AF_UNSPEC
2911         ? NULL : &txp->args.peer;
2912     txpkt.pn        = txp->next_pn[pn_space];
2913     txpkt.flags     = OSSL_QTX_PKT_FLAG_COALESCE; /* always try to coalesce */
2914 
2915     /* Generate TXPIM chunks representing STOP_SENDING and RESET_STREAM frames. */
2916     for (stream = pkt->stream_head; stream != NULL; stream = stream->txp_next)
2917         if (stream->txp_sent_stop_sending || stream->txp_sent_reset_stream) {
2918             /* Log STOP_SENDING/RESET_STREAM chunk to TXPIM. */
2919             QUIC_TXPIM_CHUNK chunk;
2920 
2921             chunk.stream_id         = stream->id;
2922             chunk.start             = UINT64_MAX;
2923             chunk.end               = 0;
2924             chunk.has_fin           = 0;
2925             chunk.has_stop_sending  = stream->txp_sent_stop_sending;
2926             chunk.has_reset_stream  = stream->txp_sent_reset_stream;
2927             if (!ossl_quic_txpim_pkt_append_chunk(tpkt, &chunk))
2928                 return 0; /* alloc error */
2929         }
2930 
2931     /* Dispatch to FIFD. */
2932     if (!ossl_quic_fifd_pkt_commit(&txp->fifd, tpkt))
2933         return 0;
2934 
2935     /*
2936      * Transmission and Post-Packet Generation Bookkeeping
2937      * ===================================================
2938      *
2939      * No backing out anymore - at this point the ACKM has recorded the packet
2940      * as having been sent, so we need to increment our next PN counter, or
2941      * the ACKM will complain when we try to record a duplicate packet with
2942      * the same PN later. At this point actually sending the packet may still
2943      * fail. In this unlikely event it will simply be handled as though it
2944      * were a lost packet.
2945      */
2946     ++txp->next_pn[pn_space];
2947     *txpim_pkt_reffed = 1;
2948 
2949     /* Send the packet. */
2950     if (!ossl_qtx_write_pkt(txp->args.qtx, &txpkt))
2951         return 0;
2952 
2953     /*
2954      * Record FC and stream abort frames as sent; deactivate streams which no
2955      * longer have anything to do.
2956      */
2957     for (stream = pkt->stream_head; stream != NULL; stream = stream->txp_next) {
2958         if (stream->txp_sent_fc) {
2959             stream->want_max_stream_data = 0;
2960             ossl_quic_rxfc_has_cwm_changed(&stream->rxfc, 1);
2961         }
2962 
2963         if (stream->txp_sent_stop_sending)
2964             stream->want_stop_sending = 0;
2965 
2966         if (stream->txp_sent_reset_stream)
2967             stream->want_reset_stream = 0;
2968 
2969         if (stream->txp_txfc_new_credit_consumed > 0) {
2970             if (!ossl_assert(ossl_quic_txfc_consume_credit(&stream->txfc,
2971                                                            stream->txp_txfc_new_credit_consumed)))
2972                 /*
2973                  * Should not be possible, but we should continue with our
2974                  * bookkeeping as we have already committed the packet to the
2975                  * FIFD. Just change the value we return.
2976                  */
2977                 rc = 0;
2978 
2979             stream->txp_txfc_new_credit_consumed = 0;
2980         }
2981 
2982         /*
2983          * If we no longer need to generate any flow control (MAX_STREAM_DATA),
2984          * STOP_SENDING or RESET_STREAM frames, nor any STREAM frames (because
2985          * the stream is drained of data or TXFC-blocked), we can mark the
2986          * stream as inactive.
2987          */
2988         ossl_quic_stream_map_update_state(txp->args.qsm, stream);
2989 
2990         if (ossl_quic_stream_has_send_buffer(stream)
2991             && !ossl_quic_sstream_has_pending(stream->sstream)
2992             && ossl_quic_sstream_get_final_size(stream->sstream, NULL))
2993             /*
2994              * Transition to DATA_SENT if stream has a final size and we have
2995              * sent all data.
2996              */
2997             ossl_quic_stream_map_notify_all_data_sent(txp->args.qsm, stream);
2998     }
2999 
3000     /* We have now sent the packet, so update state accordingly. */
3001     if (tpkt->ackm_pkt.is_ack_eliciting)
3002         txp->force_ack_eliciting &= ~(1UL << pn_space);
3003 
3004     if (tpkt->had_handshake_done_frame)
3005         txp->want_handshake_done = 0;
3006 
3007     if (tpkt->had_max_data_frame) {
3008         txp->want_max_data = 0;
3009         ossl_quic_rxfc_has_cwm_changed(txp->args.conn_rxfc, 1);
3010     }
3011 
3012     if (tpkt->had_max_streams_bidi_frame) {
3013         txp->want_max_streams_bidi = 0;
3014         ossl_quic_rxfc_has_cwm_changed(txp->args.max_streams_bidi_rxfc, 1);
3015     }
3016 
3017     if (tpkt->had_max_streams_uni_frame) {
3018         txp->want_max_streams_uni = 0;
3019         ossl_quic_rxfc_has_cwm_changed(txp->args.max_streams_uni_rxfc, 1);
3020     }
3021 
3022     if (tpkt->had_ack_frame)
3023         txp->want_ack &= ~(1UL << pn_space);
3024 
3025     if (tpkt->had_conn_close)
3026         txp->want_conn_close = 0;
3027 
3028     /*
3029      * Decrement probe request counts if we have sent a packet that meets
3030      * the requirement of a probe, namely being ACK-eliciting.
3031      */
3032     if (tpkt->ackm_pkt.is_ack_eliciting) {
3033         OSSL_ACKM_PROBE_INFO *probe_info
3034             = ossl_ackm_get0_probe_request(txp->args.ackm);
3035 
3036         if (enc_level == QUIC_ENC_LEVEL_INITIAL
3037             && probe_info->anti_deadlock_initial > 0)
3038             --probe_info->anti_deadlock_initial;
3039 
3040         if (enc_level == QUIC_ENC_LEVEL_HANDSHAKE
3041             && probe_info->anti_deadlock_handshake > 0)
3042             --probe_info->anti_deadlock_handshake;
3043 
3044         if (a.allow_force_ack_eliciting /* (i.e., not for 0-RTT) */
3045             && probe_info->pto[pn_space] > 0)
3046             --probe_info->pto[pn_space];
3047     }
3048 
3049     return rc;
3050 }
3051 
3052 /* Ensure the iovec array is at least num elements long. */
txp_el_ensure_iovec(struct txp_el * el,size_t num)3053 static int txp_el_ensure_iovec(struct txp_el *el, size_t num)
3054 {
3055     OSSL_QTX_IOVEC *iovec;
3056 
3057     if (el->alloc_iovec >= num)
3058         return 1;
3059 
3060     num = el->alloc_iovec != 0 ? el->alloc_iovec * 2 : 8;
3061 
3062     iovec = OPENSSL_realloc(el->iovec, sizeof(OSSL_QTX_IOVEC) * num);
3063     if (iovec == NULL)
3064         return 0;
3065 
3066     el->iovec          = iovec;
3067     el->alloc_iovec    = num;
3068     return 1;
3069 }
3070 
ossl_quic_tx_packetiser_schedule_conn_close(OSSL_QUIC_TX_PACKETISER * txp,const OSSL_QUIC_FRAME_CONN_CLOSE * f)3071 int ossl_quic_tx_packetiser_schedule_conn_close(OSSL_QUIC_TX_PACKETISER *txp,
3072                                                 const OSSL_QUIC_FRAME_CONN_CLOSE *f)
3073 {
3074     char *reason = NULL;
3075     size_t reason_len = f->reason_len;
3076     size_t max_reason_len = txp_get_mdpl(txp) / 2;
3077 
3078     if (txp->want_conn_close)
3079         return 0;
3080 
3081     /*
3082      * Arbitrarily limit the length of the reason length string to half of the
3083      * MDPL.
3084      */
3085     if (reason_len > max_reason_len)
3086         reason_len = max_reason_len;
3087 
3088     if (reason_len > 0) {
3089         reason = OPENSSL_memdup(f->reason, reason_len);
3090         if (reason == NULL)
3091             return 0;
3092     }
3093 
3094     txp->conn_close_frame               = *f;
3095     txp->conn_close_frame.reason        = reason;
3096     txp->conn_close_frame.reason_len    = reason_len;
3097     txp->want_conn_close                = 1;
3098     return 1;
3099 }
3100 
ossl_quic_tx_packetiser_set_msg_callback(OSSL_QUIC_TX_PACKETISER * txp,ossl_msg_cb msg_callback,SSL * msg_callback_ssl)3101 void ossl_quic_tx_packetiser_set_msg_callback(OSSL_QUIC_TX_PACKETISER *txp,
3102                                               ossl_msg_cb msg_callback,
3103                                               SSL *msg_callback_ssl)
3104 {
3105     txp->msg_callback = msg_callback;
3106     txp->msg_callback_ssl = msg_callback_ssl;
3107 }
3108 
ossl_quic_tx_packetiser_set_msg_callback_arg(OSSL_QUIC_TX_PACKETISER * txp,void * msg_callback_arg)3109 void ossl_quic_tx_packetiser_set_msg_callback_arg(OSSL_QUIC_TX_PACKETISER *txp,
3110                                                   void *msg_callback_arg)
3111 {
3112     txp->msg_callback_arg = msg_callback_arg;
3113 }
3114 
ossl_quic_tx_packetiser_get_next_pn(OSSL_QUIC_TX_PACKETISER * txp,uint32_t pn_space)3115 QUIC_PN ossl_quic_tx_packetiser_get_next_pn(OSSL_QUIC_TX_PACKETISER *txp,
3116                                             uint32_t pn_space)
3117 {
3118     if (pn_space >= QUIC_PN_SPACE_NUM)
3119         return UINT64_MAX;
3120 
3121     return txp->next_pn[pn_space];
3122 }
3123 
ossl_quic_tx_packetiser_get_deadline(OSSL_QUIC_TX_PACKETISER * txp)3124 OSSL_TIME ossl_quic_tx_packetiser_get_deadline(OSSL_QUIC_TX_PACKETISER *txp)
3125 {
3126     /*
3127      * TXP-specific deadline computations which rely on TXP innards. This is in
3128      * turn relied on by the QUIC_CHANNEL code to determine the channel event
3129      * handling deadline.
3130      */
3131     OSSL_TIME deadline = ossl_time_infinite();
3132     uint32_t enc_level, pn_space;
3133 
3134     /*
3135      * ACK generation is not CC-gated - packets containing only ACKs are allowed
3136      * to bypass CC. We want to generate ACK frames even if we are currently
3137      * restricted by CC so the peer knows we have received data. The generate
3138      * call will take care of selecting the correct packet archetype.
3139      */
3140     for (enc_level = QUIC_ENC_LEVEL_INITIAL;
3141          enc_level < QUIC_ENC_LEVEL_NUM;
3142          ++enc_level)
3143         if (ossl_qtx_is_enc_level_provisioned(txp->args.qtx, enc_level)) {
3144             pn_space = ossl_quic_enc_level_to_pn_space(enc_level);
3145             deadline = ossl_time_min(deadline,
3146                                      ossl_ackm_get_ack_deadline(txp->args.ackm, pn_space));
3147         }
3148 
3149     /* When will CC let us send more? */
3150     if (txp->args.cc_method->get_tx_allowance(txp->args.cc_data) == 0)
3151         deadline = ossl_time_min(deadline,
3152                                  txp->args.cc_method->get_wakeup_deadline(txp->args.cc_data));
3153 
3154     return deadline;
3155 }
3156