mirror of
				https://github.com/LadybirdBrowser/ladybird.git
				synced 2025-10-26 18:09:45 +00:00 
			
		
		
		
	We were off-by-one when returning the result of parsing a quoted string in Web::Fetch::Infrastructure::collect_an_http_quoted_string. Instead of backtracking the lexer and consuming the backtracked string, do a simple substring operation.
		
			
				
	
	
		
			78 lines
		
	
	
	
		
			2.5 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			78 lines
		
	
	
	
		
			2.5 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2022, Luke Wilde <lukew@serenityos.org>
 | |
|  *
 | |
|  * SPDX-License-Identifier: BSD-2-Clause
 | |
|  */
 | |
| 
 | |
| #include <AK/GenericLexer.h>
 | |
| #include <AK/String.h>
 | |
| #include <AK/StringBuilder.h>
 | |
| #include <LibWeb/Fetch/Infrastructure/HTTP.h>
 | |
| 
 | |
| namespace Web::Fetch::Infrastructure {
 | |
| 
 | |
| // https://fetch.spec.whatwg.org/#collect-an-http-quoted-string
 | |
| ErrorOr<String> collect_an_http_quoted_string(GenericLexer& lexer, HttpQuotedStringExtractValue extract_value)
 | |
| {
 | |
|     // To collect an HTTP quoted string from a string input, given a position variable position and optionally an extract-value flag, run these steps:
 | |
|     // 1. Let positionStart be position.
 | |
|     auto position_start = lexer.tell();
 | |
| 
 | |
|     // 2. Let value be the empty string.
 | |
|     StringBuilder value;
 | |
| 
 | |
|     // 3. Assert: the code point at position within input is U+0022 (").
 | |
|     VERIFY(lexer.peek() == '"');
 | |
| 
 | |
|     // 4. Advance position by 1.
 | |
|     lexer.ignore(1);
 | |
| 
 | |
|     // 5. While true:
 | |
|     while (true) {
 | |
|         // 1. Append the result of collecting a sequence of code points that are not U+0022 (") or U+005C (\) from input, given position, to value.
 | |
|         auto value_part = lexer.consume_until([](char ch) {
 | |
|             return ch == '"' || ch == '\\';
 | |
|         });
 | |
| 
 | |
|         value.append(value_part);
 | |
| 
 | |
|         // 2. If position is past the end of input, then break.
 | |
|         if (lexer.is_eof())
 | |
|             break;
 | |
| 
 | |
|         // 3. Let quoteOrBackslash be the code point at position within input.
 | |
|         // 4. Advance position by 1.
 | |
|         char quote_or_backslash = lexer.consume();
 | |
| 
 | |
|         // 5. If quoteOrBackslash is U+005C (\), then:
 | |
|         if (quote_or_backslash == '\\') {
 | |
|             // 1. If position is past the end of input, then append U+005C (\) to value and break.
 | |
|             if (lexer.is_eof()) {
 | |
|                 value.append('\\');
 | |
|                 break;
 | |
|             }
 | |
| 
 | |
|             // 2. Append the code point at position within input to value.
 | |
|             // 3. Advance position by 1.
 | |
|             value.append(lexer.consume());
 | |
|         }
 | |
| 
 | |
|         // 6. Otherwise:
 | |
|         else {
 | |
|             // 1. Assert: quoteOrBackslash is U+0022 (").
 | |
|             VERIFY(quote_or_backslash == '"');
 | |
| 
 | |
|             // 2. Break.
 | |
|             break;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     // 6. If the extract-value flag is set, then return value.
 | |
|     if (extract_value == HttpQuotedStringExtractValue::Yes)
 | |
|         return value.to_string();
 | |
| 
 | |
|     // 7. Return the code points from positionStart to position, inclusive, within input.
 | |
|     return String::from_utf8(lexer.input().substring_view(position_start, lexer.tell() - position_start));
 | |
| }
 | |
| 
 | |
| }
 |