mirror of
				https://github.com/RGBCube/serenity
				synced 2025-10-26 00:12:33 +00:00 
			
		
		
		
	 6a95df2526
			
		
	
	
		6a95df2526
		
	
	
	
	
		
			
			This ripples down to LibWeb's HTML and XHR decoders, which therefore become less allocation heavy.
		
			
				
	
	
		
			92 lines
		
	
	
	
		
			2.7 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			92 lines
		
	
	
	
		
			2.7 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2020-2021, Andreas Kling <kling@serenityos.org>
 | |
|  * Copyright (c) 2022, Jelle Raaijmakers <jelle@gmta.nl>
 | |
|  *
 | |
|  * SPDX-License-Identifier: BSD-2-Clause
 | |
|  */
 | |
| 
 | |
| #pragma once
 | |
| 
 | |
| #include <AK/Forward.h>
 | |
| #include <AK/Function.h>
 | |
| 
 | |
| namespace TextCodec {
 | |
| 
 | |
| class Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) = 0;
 | |
|     virtual String to_utf8(StringView);
 | |
| 
 | |
| protected:
 | |
|     virtual ~Decoder() = default;
 | |
| };
 | |
| 
 | |
| class UTF8Decoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
|     virtual String to_utf8(StringView) override;
 | |
| };
 | |
| 
 | |
| class UTF16BEDecoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
|     virtual String to_utf8(StringView) override;
 | |
| };
 | |
| 
 | |
| class UTF16LEDecoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
|     virtual String to_utf8(StringView) override;
 | |
| };
 | |
| 
 | |
| class Latin1Decoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
| };
 | |
| 
 | |
| class Latin2Decoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
| };
 | |
| 
 | |
| class HebrewDecoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
| };
 | |
| 
 | |
| class CyrillicDecoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
| };
 | |
| 
 | |
| class Koi8RDecoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
| };
 | |
| 
 | |
| class Latin9Decoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
| };
 | |
| 
 | |
| class TurkishDecoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
| };
 | |
| 
 | |
| class XUserDefinedDecoder final : public Decoder {
 | |
| public:
 | |
|     virtual void process(StringView, Function<void(u32)> on_code_point) override;
 | |
| };
 | |
| 
 | |
| Decoder* decoder_for(String const& encoding);
 | |
| Optional<StringView> get_standardized_encoding(StringView encoding);
 | |
| 
 | |
| // This returns the appropriate Unicode decoder for the sniffed BOM or nullptr if there is no appropriate decoder.
 | |
| Decoder* bom_sniff_to_decoder(StringView);
 | |
| 
 | |
| // NOTE: This has an obnoxious name to discourage usage. Only use this if you absolutely must! For example, XHR in LibWeb uses this.
 | |
| // This will use the given decoder unless there is a byte order mark in the input, in which we will instead use the appropriate Unicode decoder.
 | |
| String convert_input_to_utf8_using_given_decoder_unless_there_is_a_byte_order_mark(Decoder&, StringView);
 | |
| 
 | |
| }
 |