// Copyright 2017 PDFium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com #ifndef XFA_FDE_XML_CFDE_XMLSYNTAXPARSER_H_ #define XFA_FDE_XML_CFDE_XMLSYNTAXPARSER_H_ #include #include "core/fxcrt/cfx_blockbuffer.h" #include "core/fxcrt/cfx_retain_ptr.h" #include "core/fxcrt/fx_string.h" #include "xfa/fde/xml/cfde_xmlnode.h" #include "xfa/fgas/crt/ifgas_stream.h" enum class FDE_XmlSyntaxResult { None, InstructionOpen, InstructionClose, ElementOpen, ElementBreak, ElementClose, TargetName, TagName, AttriName, AttriValue, Text, CData, TargetData, Error, EndOfString }; class CFDE_XMLSyntaxParser { public: CFDE_XMLSyntaxParser(); ~CFDE_XMLSyntaxParser(); void Init(const CFX_RetainPtr& pStream, int32_t iXMLPlaneSize, int32_t iTextDataSize = 256); FDE_XmlSyntaxResult DoSyntaxParse(); int32_t GetStatus() const; int32_t GetCurrentPos() const { return m_iParsedChars + (m_pStart - m_pBuffer); } FX_FILESIZE GetCurrentBinaryPos() const; int32_t GetCurrentNodeNumber() const { return m_iCurrentNodeNum; } int32_t GetLastNodeNumber() const { return m_iLastNodeNum; } void GetTargetName(CFX_WideString& wsTarget) const { wsTarget = m_BlockBuffer.GetTextData(0, m_iTextDataLength); } void GetTagName(CFX_WideString& wsTag) const { wsTag = m_BlockBuffer.GetTextData(0, m_iTextDataLength); } void GetAttributeName(CFX_WideString& wsAttriName) const { wsAttriName = m_BlockBuffer.GetTextData(0, m_iTextDataLength); } void GetAttributeValue(CFX_WideString& wsAttriValue) const { wsAttriValue = m_BlockBuffer.GetTextData(0, m_iTextDataLength); } void GetTextData(CFX_WideString& wsText) const { wsText = m_BlockBuffer.GetTextData(0, m_iTextDataLength); } void GetTargetData(CFX_WideString& wsData) const { wsData = m_BlockBuffer.GetTextData(0, m_iTextDataLength); } protected: enum class FDE_XmlSyntaxState { Text, Node, Target, Tag, AttriName, AttriEqualSign, AttriQuotation, AttriValue, Entity, EntityDecimal, EntityHex, CloseInstruction, BreakElement, CloseElement, SkipDeclNode, DeclCharData, SkipComment, SkipCommentOrDecl, SkipCData, TargetData }; void ParseTextChar(wchar_t ch); CFX_RetainPtr m_pStream; int32_t m_iXMLPlaneSize; int32_t m_iCurrentPos; int32_t m_iCurrentNodeNum; int32_t m_iLastNodeNum; int32_t m_iParsedChars; int32_t m_iParsedBytes; wchar_t* m_pBuffer; int32_t m_iBufferChars; bool m_bEOS; wchar_t* m_pStart; wchar_t* m_pEnd; FDE_XMLNODE m_CurNode; std::stack m_XMLNodeStack; CFX_BlockBuffer m_BlockBuffer; int32_t m_iAllocStep; int32_t& m_iDataLength; wchar_t* m_pCurrentBlock; int32_t m_iIndexInBlock; int32_t m_iTextDataLength; FDE_XmlSyntaxResult m_syntaxParserResult; FDE_XmlSyntaxState m_syntaxParserState; wchar_t m_wQuotationMark; int32_t m_iEntityStart; std::stack m_SkipStack; wchar_t m_SkipChar; }; #endif // XFA_FDE_XML_CFDE_XMLSYNTAXPARSER_H_