measurement-factory · eduard-bagdasaryan · Apr 18, 2023 · Dec 4, 2023 · Dec 6, 2023 · Dec 6, 2023
diff --git a/src/parser/BinaryTokenizer.h b/src/parser/BinaryTokenizer.h
@@ -60,6 +60,9 @@ class BinaryTokenizer
     /// this method avoids append overheads during incremental parsing
     void reinput(const SBuf &data, const bool expectMore) { data_ = data; expectMore_ = expectMore; }
 
+    /// adds more data bytes to parse
+    void append(const SBuf &data) { data_.append(data); }
+
     /// make progress: future parsing failures will not rollback beyond this point
     void commit();
 
@@ -110,6 +113,11 @@ class BinaryTokenizer
     /// debugging helper for parsed multi-field structures
     void got(uint64_t size, const char *description) const;
 
+    /// whether more data bytes may arrive in the future
+    bool expectMore() const { return expectMore_; }
+    /// sets whether more data bytes may arrive in the future
+    void expectMore(bool val) { expectMore_ = val; }
+
     const BinaryTokenizerContext *context; ///< debugging: thing being parsed
 
 protected:

diff --git a/src/security/Handshake.cc b/src/security/Handshake.cc
@@ -274,24 +274,30 @@ Security::HandshakeParser::parseModernRecord()
     Must(record.fragment.length() || record.type == ContentType::ctApplicationData);
 
     if (currentContentType != record.type) {
+        tkMessages.expectMore(false);
         parseMessages();
         Must(tkMessages.atEnd()); // no currentContentType leftovers
-        fragments = record.fragment;
         currentContentType = record.type;
-    } else {
-        fragments.append(record.fragment);
     }
 
-    if (tkRecords.atEnd() && !done)
-        parseMessages();
+    const auto haveUnparsedRecordBytes = !tkRecords.atEnd();
+    const auto expectMoreRecordLayerBytes = tkRecords.expectMore();
+    // TODO: consider adding BinaryTokenizer::exhausted() instead
+    const auto expectMoreMessageLayerBytes = haveUnparsedRecordBytes || expectMoreRecordLayerBytes;
+
+    tkMessages.expectMore(expectMoreMessageLayerBytes);
+    tkMessages.append(record.fragment);
+
+    parseMessages();
 }
 
 /// parses one or more "higher-level protocol" frames of currentContentType
 void
 Security::HandshakeParser::parseMessages()
 {
-    tkMessages.reset(fragments, false);
-    for (; !tkMessages.atEnd(); tkMessages.commit()) {
+    tkMessages.rollback();
+
+    while (!tkMessages.atEnd() && !done) {
         switch (currentContentType) {
         case ContentType::ctChangeCipherSpec:
             parseChangeCipherCpecMessage();
@@ -335,6 +341,7 @@ Security::HandshakeParser::parseAlertMessage()
 {
     Must(currentContentType == ContentType::ctAlert);
     const Alert alert(tkMessages);
+    tkMessages.commit();
     debugs(83, (alert.fatal() ? 2:3),
            "level " << static_cast<int>(alert.level) <<
            " description " << static_cast<int>(alert.description));
@@ -349,6 +356,7 @@ Security::HandshakeParser::parseHandshakeMessage()
     Must(currentContentType == ContentType::ctHandshake);
 
     const Handshake message(tkMessages);
+    tkMessages.commit();
 
     switch (message.msg_type) {
     case HandshakeType::hskClientHello:
@@ -631,10 +639,11 @@ Security::HandshakeParser::parseSupportedVersionsExtension(const SBuf &extension
 void
 Security::HandshakeParser::skipMessage(const char *description)
 {
-    // tkMessages/fragments can only contain messages of the same ContentType.
+    // tkMessages can only contain messages of the same ContentType.
     // To skip a message, we can and should skip everything we have [left]. If
-    // we have partial messages, debugging will mislead about their boundaries.
+    // we buffered a partial message, we will need to read/skip multiple times.
     tkMessages.skip(tkMessages.leftovers().length(), description);
+    tkMessages.commit();
 }
 
 bool

diff --git a/src/security/Handshake.h b/src/security/Handshake.h
@@ -115,9 +115,6 @@ class HandshakeParser
 
     const char *done; ///< not nil if we got what we were looking for
 
-    /// concatenated TLSPlaintext.fragments of TLSPlaintext.type
-    SBuf fragments;
-
     /// TLS record layer (parsing uninterpreted data)
     Parser::BinaryTokenizer tkRecords;