// Copyright 2014 PDFium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#ifndef _FXCRT_XML_INT_
#define _FXCRT_XML_INT_
class CXML_DataBufAcc : public IFX_BufferRead, public CFX_Object
{
public:
CXML_DataBufAcc(FX_LPCBYTE pBuffer, size_t size, IFX_Allocator* pAllocator = NULL)
: m_pAllocator(pAllocator)
, m_pBuffer(pBuffer)
, m_dwSize(size)
, m_dwCurPos(0)
{
}
virtual ~CXML_DataBufAcc() {}
virtual void Release()
{
if (m_pAllocator) {
FX_DeleteAtAllocator(this, m_pAllocator, CXML_DataBufAcc);
} else {
delete this;
}
}
virtual FX_BOOL IsEOF()
{
return m_dwCurPos >= m_dwSize;
}
virtual FX_FILESIZE GetPosition()
{
return (FX_FILESIZE)m_dwCurPos;
}
virtual size_t ReadBlock(void* buffer, size_t size)
{
return 0;
}
virtual FX_BOOL ReadNextBlock(FX_BOOL bRestart = FALSE)
{
if (bRestart) {
m_dwCurPos = 0;
}
if (m_dwCurPos < m_dwSize) {
m_dwCurPos = m_dwSize;
return TRUE;
}
return FALSE;
}
virtual FX_LPCBYTE GetBlockBuffer()
{
return m_pBuffer;
}
virtual size_t GetBlockSize()
{
return m_dwSize;
}
virtual FX_FILESIZE GetBlockOffset()
{
return 0;
}
protected:
IFX_Allocator* m_pAllocator;
FX_LPCBYTE m_pBuffer;
size_t m_dwSize;
size_t m_dwCurPos;
};
#define FX_XMLDATASTREAM_BufferSize (32 * 1024)
class CXML_DataStmAcc : public IFX_BufferRead, public CFX_Object
{
public:
CXML_DataStmAcc(IFX_FileRead *pFileRead, IFX_Allocator* pAllocator = NULL)
: m_pAllocator(pAllocator)
, m_pFileRead(pFileRead)
, m_pBuffer(NULL)
, m_nStart(0)
, m_dwSize(0)
{
FXSYS_assert(m_pFileRead != NULL);
}
virtual ~CXML_DataStmAcc()
{
if (m_pBuffer) {
FX_Allocator_Free(m_pAllocator, m_pBuffer);
}
}
virtual void Release()
{
if (m_pAllocator) {
FX_DeleteAtAllocator(this, m_pAllocator, CXML_DataStmAcc);
} else {
delete this;
}
}
virtual FX_BOOL IsEOF()
{
return m_nStart + (FX_FILESIZE)m_dwSize >= m_pFileRead->GetSize();
}
virtual FX_FILESIZE GetPosition()
{
return m_nStart + (FX_FILESIZE)m_dwSize;
}
virtual size_t ReadBlock(void* buffer, size_t size)
{
return 0;
}
virtual FX_BOOL ReadNextBlock(FX_BOOL bRestart = FALSE)
{
if (bRestart) {
m_nStart = 0;
}
FX_FILESIZE nLength = m_pFileRead->GetSize();
m_nStart += (FX_FILESIZE)m_dwSize;
if (m_nStart >= nLength) {
return FALSE;
}
m_dwSize = (size_t)FX_MIN(FX_XMLDATASTREAM_BufferSize, nLength - m_nStart);
if (!m_pBuffer) {
m_pBuffer = FX_Allocator_Alloc(m_pAllocator, FX_BYTE, m_dwSize);
if (!m_pBuffer) {
return FALSE;
}
}
return m_pFileRead->ReadBlock(m_pBuffer, m_nStart, m_dwSize);
}
virtual FX_LPCBYTE GetBlockBuffer()
{
return (FX_LPCBYTE)m_pBuffer;
}
virtual size_t GetBlockSize()
{
return m_dwSize;
}
virtual FX_FILESIZE GetBlockOffset()
{
return m_nStart;
}
protected:
IFX_Allocator* m_pAllocator;
IFX_FileRead *m_pFileRead;
FX_LPBYTE m_pBuffer;
FX_FILESIZE m_nStart;
size_t m_dwSize;
};
class CXML_Parser
{
public:
CXML_Parser(IFX_Allocator* pAllocator = NULL) : m_pAllocator(pAllocator) {}
~CXML_Parser();
IFX_Allocator* m_pAllocator;
IFX_BufferRead* m_pDataAcc;
FX_BOOL m_bOwnedStream;
FX_FILESIZE m_nOffset;
FX_BOOL m_bSaveSpaceChars;
FX_LPCBYTE m_pBuffer;
size_t m_dwBufferSize;
FX_FILESIZE m_nBufferOffset;
size_t m_dwIndex;
FX_BOOL Init(FX_LPBYTE pBuffer, size_t size);
FX_BOOL Init(IFX_FileRead *pFileRead);
FX_BOOL Init(IFX_BufferRead *pBuffer);
FX_BOOL Init(FX_BOOL bOwndedStream);
FX_BOOL ReadNextBlock();
FX_BOOL IsEOF();
FX_BOOL HaveAvailData();
void SkipWhiteSpaces();
void GetName(CFX_ByteStringL &space, CFX_ByteStringL &name);
void GetAttrValue(CFX_WideStringL &value);
FX_DWORD GetCharRef();
void GetTagName(CFX_ByteStringL &space, CFX_ByteStringL &name, FX_BOOL &bEndTag, FX_BOOL bStartTag = FALSE);
void SkipLiterals(FX_BSTR str);
CXML_Element* ParseElement(CXML_Element* pParent, FX_BOOL bStartTag = FALSE);
void InsertContentSegment(FX_BOOL bCDATA, FX_WSTR content, CXML_Element* pElement);
void InsertCDATASegment(CFX_UTF8Decoder& decoder, CXML_Element* pElement);
};
void FX_XML_SplitQualifiedName(FX_BSTR bsFullName, CFX_ByteStringC &bsSpace, CFX_ByteStringC &bsName);
#endif