Merge Chromium + Blink git repositories
[chromium-blink-merge.git] / third_party / WebKit / Source / core / html / parser / TextResourceDecoder.h
blobc8a55813fe551c87ad38d56deaf87df9a17ba0a0
/*
    Copyright (C) 1999 Lars Knoll (knoll@mpi-hd.mpg.de)
    Copyright (C) 2006 Alexey Proskuryakov (ap@nypop.com)
    Copyright (C) 2006, 2008 Apple Inc. All rights reserved.

    This library is free software; you can redistribute it and/or
    modify it under the terms of the GNU Library General Public
    License as published by the Free Software Foundation; either
    version 2 of the License, or (at your option) any later version.

    This library is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
    Library General Public License for more details.

    You should have received a copy of the GNU Library General Public License
    along with this library; see the file COPYING.LIB. If not, write to
    the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
    Boston, MA 02110-1301, USA.

*/
23 #ifndef TextResourceDecoder_h
24 #define TextResourceDecoder_h
26 #include "core/CoreExport.h"
27 #include "wtf/RefCounted.h"
28 #include "wtf/text/TextEncoding.h"
30 namespace blink {
32 class HTMLMetaCharsetParser;
34 class CORE_EXPORT TextResourceDecoder {
35 WTF_MAKE_FAST_ALLOCATED(TextResourceDecoder);
36 WTF_MAKE_NONCOPYABLE(TextResourceDecoder);
37 public:
38 enum EncodingSource {
39 DefaultEncoding,
40 AutoDetectedEncoding,
41 EncodingFromContentSniffing,
42 EncodingFromXMLHeader,
43 EncodingFromMetaTag,
44 EncodingFromCSSCharset,
45 EncodingFromHTTPHeader,
46 EncodingFromParentFrame
49 static PassOwnPtr<TextResourceDecoder> create(const String& mimeType, const WTF::TextEncoding& defaultEncoding = WTF::TextEncoding(), bool usesEncodingDetector = false)
51 return adoptPtr(new TextResourceDecoder(mimeType, defaultEncoding, usesEncodingDetector));
53 ~TextResourceDecoder();
55 void setEncoding(const WTF::TextEncoding&, EncodingSource);
56 const WTF::TextEncoding& encoding() const { return m_encoding; }
57 bool encodingWasDetectedHeuristically() const
59 return m_source == AutoDetectedEncoding
60 || m_source == EncodingFromContentSniffing;
63 String decode(const char* data, size_t length);
64 String flush();
66 void setHintEncoding(const WTF::TextEncoding& encoding)
68 m_hintEncoding = encoding.name();
71 void useLenientXMLDecoding() { m_useLenientXMLDecoding = true; }
72 bool sawError() const { return m_sawError; }
73 size_t checkForBOM(const char*, size_t);
75 private:
76 TextResourceDecoder(const String& mimeType, const WTF::TextEncoding& defaultEncoding, bool usesEncodingDetector);
78 enum ContentType { PlainTextContent, HTMLContent, XMLContent, CSSContent }; // PlainText only checks for BOM.
79 static ContentType determineContentType(const String& mimeType);
80 static const WTF::TextEncoding& defaultEncoding(ContentType, const WTF::TextEncoding& defaultEncoding);
82 bool checkForCSSCharset(const char*, size_t, bool& movedDataToBuffer);
83 bool checkForXMLCharset(const char*, size_t, bool& movedDataToBuffer);
84 void checkForMetaCharset(const char*, size_t);
85 bool shouldAutoDetect() const;
87 ContentType m_contentType;
88 WTF::TextEncoding m_encoding;
89 OwnPtr<TextCodec> m_codec;
90 EncodingSource m_source;
91 const char* m_hintEncoding;
92 Vector<char> m_buffer;
93 bool m_checkedForBOM;
94 bool m_checkedForCSSCharset;
95 bool m_checkedForXMLCharset;
96 bool m_checkedForMetaCharset;
97 bool m_useLenientXMLDecoding; // Don't stop on XML decoding errors.
98 bool m_sawError;
99 bool m_usesEncodingDetector;
101 OwnPtr<HTMLMetaCharsetParser> m_charsetParser;
106 #endif