95a2f54683
git-svn-id: https://svn.code.sf.net/p/apophysis7x/svn/trunk@1 a5d1c0f9-a0e9-45c6-87dd-9d276e40c949
6373 lines
204 KiB
ObjectPascal
6373 lines
204 KiB
ObjectPascal
{ unit NativeXml
|
|
|
|
This is a small-footprint implementation to read and write XML documents
|
|
natively from Delpi code.
|
|
|
|
You can use this code to read XML documents from files, streams or strings.
|
|
The load routine generates events that can be used to display load progress
|
|
on the fly.
|
|
|
|
Note: any external encoding (ANSI, UTF16, etc) is converted to an internal
|
|
encoding that is ANSI or UTF8. When the loaded document is ANSI based,
|
|
the encoding will be ANSI, in other cases (UTF8, UTF16) the encoding
|
|
will be UTF8.
|
|
|
|
Original Author: Nils Haeck M.Sc. (n.haeck@simdesign.nl)
|
|
Original Date: 01 Apr 2003
|
|
Version: see below
|
|
Copyright (c) 2003-2010 Simdesign BV
|
|
Contributor(s): Stefan Glienke
|
|
|
|
It is NOT allowed under ANY circumstances to publish or copy this code
|
|
without accepting the license conditions in accompanying LICENSE.txt
|
|
first!
|
|
|
|
This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF
|
|
ANY KIND, either express or implied.
|
|
|
|
Please visit http://www.simdesign.nl/xml.html for more information.
|
|
}
|
|
unit NativeXml;
|
|
|
|
interface
|
|
|
|
{$i nativexml.inc}
|
|
|
|
uses
|
|
Windows,
|
|
{$IFDEF CLR}
|
|
System.Text,
|
|
{$ENDIF}
|
|
{$IFDEF USEGRAPHICS}
|
|
{$IFDEF LINUX}
|
|
QGraphics,
|
|
{$ELSE}
|
|
Graphics,
|
|
{$ENDIF}
|
|
{$ENDIF}
|
|
Classes,
|
|
SysUtils;
|
|
|
|
const
|
|
|
|
// Current version of the NativeXml unit
|
|
cNativeXmlVersion = '3.10';
|
|
|
|
// cross-platform pointer type
|
|
type
|
|
{$IFDEF CLR}
|
|
TPointer = TObject;
|
|
{$ELSE}
|
|
TPointer = Pointer;
|
|
{$ENDIF}
|
|
|
|
{$IFDEF D12UP}
|
|
// Delphi 2009 and up
|
|
type
|
|
UnicodeChar = Char;
|
|
PUnicodeChar = PChar;
|
|
{$ELSE}
|
|
// Delphi 2007 and below
|
|
type
|
|
UnicodeString = WideString;
|
|
UnicodeChar = WideChar;
|
|
PUnicodeChar = PWideChar;
|
|
RawByteString = AnsiString;
|
|
{$ENDIF}
|
|
|
|
type
|
|
|
|
// Note on TNativeXml.Format:
|
|
// - xfReadable (default) to be able to read the xml file with a standard editor.
|
|
// - xfCompact to save the xml fully compliant and at smallest size
|
|
TXmlFormatType = (
|
|
xfReadable, // Save in readable format with CR-LF and indents
|
|
xfCompact // Save without any control chars except LF after declarations
|
|
);
|
|
|
|
// TXmlElementType enumerates the different kinds of elements that can be found
|
|
// in the XML document.
|
|
TXmlElementType = (
|
|
xeNormal, // Normal element <name {attr}>[value][sub-elements]</name>
|
|
xeComment, // Comment <!--{comment}-->
|
|
xeCData, // literal data <![CDATA[{data}]]>
|
|
xeDeclaration, // XML declaration <?xml{declaration}?>
|
|
xeStylesheet, // Stylesheet <?xml-stylesheet{stylesheet}?>
|
|
xeDoctype, // DOCTYPE DTD declaration <!DOCTYPE{spec}>
|
|
xeElement, // <!ELEMENT >
|
|
xeAttList, // <!ATTLIST >
|
|
xeEntity, // <!ENTITY >
|
|
xeNotation, // <!NOTATION >
|
|
xeExclam, // Any <!data>
|
|
xeQuestion, // Any <?data?>
|
|
xeCharData, // character data in a node
|
|
xeUnknown // Any <data>
|
|
);
|
|
|
|
// Choose what kind of binary encoding will be used when calling
|
|
// TXmlNode BufferRead and BufferWrite.
|
|
TBinaryEncodingType = (
|
|
xbeBinHex, { With this encoding, each byte is stored as a hexadecimal
|
|
number, e.g. 0 = 00 and 255 = FF. }
|
|
xbeBase64 { With this encoding, each group of 3 bytes are stored as 4
|
|
characters, requiring 64 different AnsiCharacters.}
|
|
);
|
|
|
|
// Definition of different methods of String encoding.
|
|
TStringEncodingType = (
|
|
seAnsi, // General 8 bit encoding, encoding must be determined from encoding declaration
|
|
seUCS4BE, // UCS-4 Big Endian
|
|
seUCS4LE, // UCS-4 Little Endian
|
|
seUCS4_2143, // UCS-4 unusual octet order (2143)
|
|
seUCS4_3412, // UCS-4 unusual octet order (3412)
|
|
se16BitBE, // General 16 bit Big Endian, encoding must be determined from encoding declaration
|
|
se16BitLE, // General 16 bit Little Endian, encoding must be determined from encoding declaration
|
|
seUTF8, // UTF-8
|
|
seUTF16BE, // UTF-16 Big Endian
|
|
seUTF16LE, // UTF-16 Little Endian
|
|
seEBCDIC // EBCDIC flavour
|
|
);
|
|
|
|
TXmlCompareOption = (
|
|
xcNodeName,
|
|
xcNodeType,
|
|
xcNodeValue,
|
|
xcAttribCount,
|
|
xcAttribNames,
|
|
xcAttribValues,
|
|
xcChildCount,
|
|
xcChildNames,
|
|
xcChildValues,
|
|
xcRecursive
|
|
);
|
|
|
|
TXmlCompareOptions = set of TXmlCompareOption;
|
|
|
|
const
|
|
|
|
xcAll: TXmlCompareOptions = [xcNodeName, xcNodeType, xcNodeValue, xcAttribCount,
|
|
xcAttribNames, xcAttribValues, xcChildCount, xcChildNames, xcChildValues,
|
|
xcRecursive];
|
|
|
|
var
|
|
|
|
// XML Defaults
|
|
|
|
cDefaultEncodingString: UTF8String = 'UTF-8';
|
|
cDefaultExternalEncoding: TStringEncodingType = seUTF8;
|
|
cDefaultVersionString: UTF8String = '1.0';
|
|
cDefaultXmlFormat: TXmlFormatType = xfCompact;
|
|
cDefaultWriteOnDefault: boolean = True;
|
|
cDefaultBinaryEncoding: TBinaryEncodingType = xbeBase64;
|
|
cDefaultIndentString: UTF8String = ' ';
|
|
cDefaultDropCommentsOnParse: boolean = False;
|
|
cDefaultUseFullNodes: boolean = False;
|
|
cDefaultUseLocalBias: boolean = False;
|
|
cDefaultFloatAllowScientific: boolean = True;
|
|
cDefaultFloatSignificantDigits: integer = 6;
|
|
|
|
type
|
|
|
|
TXmlNode = class;
|
|
TNativeXml = class;
|
|
TsdCodecStream = class;
|
|
|
|
// An event that is based on the TXmlNode object Node.
|
|
TXmlNodeEvent = procedure(Sender: TObject; Node: TXmlNode) of object;
|
|
|
|
// An event that is used to indicate load or save progress.
|
|
TXmlProgressEvent = procedure(Sender: TObject; Size: integer) of object;
|
|
|
|
// This event is used in the TNativeXml.OnNodeCompare event, and should
|
|
// return -1 if Node1 < Node2, 0 if Node1 = Node2 and 1 if Node1 > Node2.
|
|
TXmlNodeCompareEvent = function(Sender: TObject; Node1, Node2: TXmlNode; Info: TPointer): integer of object;
|
|
|
|
// Pass a function of this kind to TXmlNode.SortChildNodes. The function should
|
|
// return -1 if Node1 < Node2, 0 if Node1 = Node2 and 1 if Node1 > Node2.
|
|
TXMLNodeCompareFunction = function(Node1, Node2: TXmlNode; Info: TPointer): integer;
|
|
|
|
// Very simple autonomous stringlist that holds the list of attributes in the node
|
|
TsdUTF8StringList = class(TPersistent)
|
|
private
|
|
FItems: array of UTF8String;
|
|
FCount: integer;
|
|
function GetItems(Index: integer): UTF8String;
|
|
procedure SetItems(Index: integer; const Value: UTF8String);
|
|
function GetValues(const Name: UTF8String): UTF8String;
|
|
function GetNames(Index: integer): UTF8String;
|
|
procedure SetValues(const Name, Value: UTF8String);
|
|
function GetText: UTF8String;
|
|
public
|
|
function Add(const S: UTF8String): integer;
|
|
procedure Assign(Source: TPersistent); override;
|
|
procedure Clear;
|
|
procedure Delete(Index: Integer);
|
|
function IndexOfName(const Name: UTF8String): integer;
|
|
property Count: integer read FCount;
|
|
property Items[Index: integer]: UTF8String read GetItems write SetItems; default;
|
|
property Names[Index: integer]: UTF8String read GetNames;
|
|
property Values[const Name: UTF8String]: UTF8String read GetValues write SetValues;
|
|
property Text: UTF8String read GetText;
|
|
end;
|
|
|
|
// The TXmlNode represents an element in the XML file. Each TNativeXml holds
|
|
// one Root element. Under ths root element, sub-elements can be nested (there
|
|
// is no limit on how deep). Property ElementType defines what kind of element
|
|
// this node is.
|
|
TXmlNode = class(TPersistent)
|
|
private
|
|
FName: UTF8String; // The element name
|
|
FValue: UTF8String; // The *escaped* value
|
|
FAttributes: TsdUTF8StringList; // List with attributes
|
|
FNodes: TList; // These are the child elements
|
|
FParent: TXmlNode; // Pointer to parent element
|
|
FDocument: TNativeXml; // Pointer to parent XmlDocument
|
|
FElementType: TXmlElementType; // The type of element
|
|
FTag: integer; // A value the developer can use
|
|
function AbortParsing: boolean;
|
|
function GetValueAsString: UTF8String;
|
|
procedure SetAttributeName(Index: integer; const Value: UTF8String);
|
|
procedure SetAttributeValue(Index: integer; const Value: UTF8String);
|
|
procedure SetValueAsString(const AValue: UTF8String);
|
|
function GetIndent: UTF8String;
|
|
function GetLineFeed: UTF8String;
|
|
function GetTreeDepth: integer;
|
|
function GetAttributeCount: integer;
|
|
function GetAttributePair(Index: integer): UTF8String;
|
|
function GetAttributeName(Index: integer): UTF8String;
|
|
function GetAttributeValue(Index: integer): UTF8String;
|
|
function GetWriteOnDefault: boolean;
|
|
function GetBinaryEncoding: TBinaryEncodingType;
|
|
function GetCascadedName: UTF8String;
|
|
function QualifyAsDirectNode: boolean;
|
|
procedure SetName(const Value: UTF8String);
|
|
function GetFullPath: UTF8String;
|
|
procedure SetBinaryEncoding(const Value: TBinaryEncodingType);
|
|
function GetBinaryString: RawByteString;
|
|
procedure SetBinaryString(const Value: RawByteString);
|
|
function UseFullNodes: boolean;
|
|
function UseLocalBias: Boolean;
|
|
function GetValueAsUnicodeString: UnicodeString;
|
|
procedure SetValueAsUnicodeString(const Value: UnicodeString);
|
|
function GetAttributeByName(const AName: UTF8String): UTF8String;
|
|
procedure SetAttributeByName(const AName, Value: UTF8String);
|
|
function GetValueAsInteger: integer;
|
|
procedure SetValueAsInteger(const Value: integer);
|
|
function GetValueAsFloat: double;
|
|
procedure SetValueAsFloat(const Value: double);
|
|
function GetValueAsDateTime: TDateTime;
|
|
procedure SetValueAsDateTime(const Value: TDateTime);
|
|
function GetValueAsBool: boolean;
|
|
procedure SetValueAsBool(const Value: boolean);
|
|
function GetValueAsInt64: int64;
|
|
procedure SetValueAsInt64(const Value: int64);
|
|
procedure CheckCreateAttributesList;
|
|
function GetAttributeValueAsUnicodeString(Index: integer): UnicodeString;
|
|
procedure SetAttributeValueAsUnicodeString(Index: integer;
|
|
const Value: UnicodeString);
|
|
function GetAttributeValueAsInteger(Index: integer): integer;
|
|
procedure SetAttributeValueAsInteger(Index: integer;
|
|
const Value: integer);
|
|
function GetAttributeByNameWide(const AName: UTF8String): UnicodeString;
|
|
procedure SetAttributeByNameWide(const AName: UTF8String;
|
|
const Value: UnicodeString);
|
|
function GetTotalNodeCount: integer;
|
|
function FloatSignificantDigits: integer;
|
|
function FloatAllowScientific: boolean;
|
|
function GetAttributeValueDirect(Index: integer): UTF8String;
|
|
procedure SetAttributeValueDirect(Index: integer; const Value: UTF8String);
|
|
protected
|
|
function CompareNodeName(const NodeName: UTF8String): integer;
|
|
procedure DeleteEmptyAttributes;
|
|
function GetNodes(Index: integer): TXmlNode; virtual;
|
|
function GetNodeCount: integer; virtual;
|
|
procedure ParseTag(const AValue: UTF8String; TagStart, TagClose: integer);
|
|
procedure ReadFromStream(S: TStream); virtual;
|
|
procedure ReadFromString(const AValue: UTF8String); virtual;
|
|
procedure ResolveEntityReferences;
|
|
function UnescapeString(const AValue: UTF8String): UTF8String; virtual;
|
|
function WriteInnerTag: UTF8String; virtual;
|
|
procedure WriteToStream(S: TStream); virtual;
|
|
procedure ChangeDocument(ADocument: TNativeXml);
|
|
public
|
|
// Create a new TXmlNode object. ADocument must be the TNativeXml that is
|
|
// going to hold this new node.
|
|
constructor Create(ADocument: TNativeXml); virtual;
|
|
// \Create a new TXmlNode with name AName. ADocument must be the TNativeXml
|
|
// that is going to hold this new node.
|
|
constructor CreateName(ADocument: TNativeXml; const AName: UTF8String); virtual;
|
|
// \Create a new TXmlNode with name AName and UTF8String value AValue. ADocument
|
|
// must be the TNativeXml that is going to hold this new node.
|
|
constructor CreateNameValue(ADocument: TNativeXml; const AName, AValue: UTF8String); virtual;
|
|
// \Create a new TXmlNode with XML element type AType. ADocument must be the
|
|
// TNativeXml that is going to hold this new node.
|
|
constructor CreateType(ADocument: TNativeXml; AType: TXmlElementType); virtual;
|
|
// Use Assign to assign another TXmlNode to this node. This means that all
|
|
// properties and subnodes from the Source TXmlNode are copied to the current
|
|
// node. You can also Assign a TNativeXml document to the node, in that case
|
|
// the RootNodeList property of the TNativeXml object will be copied.
|
|
procedure Assign(Source: TPersistent); override;
|
|
// Call Delete to delete this node completely from the parent node list. This
|
|
// call only succeeds if the node has a parent. It has no effect when called for
|
|
// the root node.
|
|
procedure Delete; virtual;
|
|
// \Delete all nodes that are empty (this means, which have no subnodes, no
|
|
// attributes, and no value assigned). This procedure works recursively.
|
|
procedure DeleteEmptyNodes;
|
|
// Destroy a TXmlNode object. This will free the child node list automatically.
|
|
// Never call this method directly. All TXmlNodes in the document will be
|
|
// recursively freed when TNativeXml.Free is called.
|
|
destructor Destroy; override;
|
|
// Use this method to add an integer attribute to the node.
|
|
procedure AttributeAdd(const AName: UTF8String; AValue: integer); overload;
|
|
// Use this method to add a string attribute with value AValue to the node.
|
|
procedure AttributeAdd(const AName, AValue: UTF8String); overload;
|
|
// Use this method to delete the attribute at Index in the list. Index must be
|
|
// equal or greater than 0, and smaller than AttributeCount. Using an index
|
|
// outside of that range has no effect.
|
|
procedure AttributeDelete(Index: integer);
|
|
// Switch position of the attributes at Index1 and Index2.
|
|
procedure AttributeExchange(Index1, Index2: integer);
|
|
// Use this method to find the index of an attribute with name AName.
|
|
function AttributeIndexByname(const AName: UTF8String): integer;
|
|
// \Clear all attributes from the current node.
|
|
procedure AttributesClear; virtual;
|
|
// Use this method to read binary data from the node into Buffer with a length of Count.
|
|
procedure BufferRead(var Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Count: Integer); virtual;
|
|
// Use this method to write binary data in Buffer with a length of Count to the
|
|
// current node. The data will appear as text using either BinHex or Base64
|
|
// method) in the final XML document.
|
|
// Notice that NativeXml does only support up to 2Gb bytes of data per file,
|
|
// so do not use this option for huge files. The binary encoding method (converting
|
|
// binary data into text) can be selected using property BinaryEncoding.
|
|
// xbeBase64 is most efficient, but slightly slower. Always use identical methods
|
|
// for reading and writing.
|
|
procedure BufferWrite(const Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Count: Integer); virtual;
|
|
// Returns the length of the data in the buffer, once it would be decoded by
|
|
// method xbeBinHex or xbeBase64. If BinaryEncoding is xbeSixBits, this function
|
|
// cannot be used. The length of the unencoded data is determined from the
|
|
// length of the encoded data. For xbeBinHex this is trivial (just half the
|
|
// length), for xbeBase64 this is more difficult (must use the padding characters)
|
|
function BufferLength: integer; virtual;
|
|
// Clear all child nodes and attributes, and the name and value of the current
|
|
// XML node. However, the node is not deleted. Call Delete instead for that.
|
|
procedure Clear; virtual;
|
|
// Find the first node which has name NodeName. Contrary to the NodeByName
|
|
// function, this function will search the whole subnode tree, using the
|
|
// DepthFirst method. It is possible to search for a full path too, e.g.
|
|
// FoundNode := MyNode.FindNode('/Root/SubNode1/SubNode2/ThisNode');
|
|
function FindNode(const NodeName: UTF8String): TXmlNode;
|
|
// Find all nodes which have name NodeName. Contrary to the NodesByName
|
|
// function, this function will search the whole subnode tree. If you use
|
|
// a TXmlNodeList for the AList parameter, you don't need to cast the list
|
|
// items to TXmlNode.
|
|
procedure FindNodes(const NodeName: UTF8String; const AList: TList);
|
|
// Use FromAnsiString to convert a normal ANSI String to a UTF8String for the node
|
|
// (name, value, attributes). In TNativeXml the ANSI Characters are encoded
|
|
// into UTF8.
|
|
function FromAnsiString(const s: AnsiString): UTF8String;
|
|
// Use FromUnicodeString to convert UnicodeString to a UTF8String for the node (name, value,
|
|
// attributes).
|
|
function FromUnicodeString(const W: UnicodeString): UTF8String;
|
|
// Use HasAttribute to determine if the node has an attribute with name AName.
|
|
function HasAttribute(const AName: UTF8String): boolean; virtual;
|
|
// This function returns the index of this node in the parent's node list.
|
|
// If Parent is not assigned, this function returns -1.
|
|
function IndexInParent: integer;
|
|
// This function returns True if the node has no subnodes and no attributes,
|
|
// and if the node Name and value are empty.
|
|
function IsClear: boolean; virtual;
|
|
// This function returns True if the node has no subnodes and no attributes,
|
|
// and if the node value is empty.
|
|
function IsEmpty: boolean; virtual;
|
|
function IsEqualTo(ANode: TXmlNode; Options: TXmlCompareOptions; MismatchNodes: TList = nil): boolean;
|
|
// Add the node ANode as a new subelement in the nodelist. The node will be
|
|
// added in position NodeCount (which will be returned).
|
|
function NodeAdd(ANode: TXmlNode): integer; virtual;
|
|
// This function returns a pointer to the first subnode that has an attribute with
|
|
// name AttribName and value AttribValue. If ShouldRecurse = True (default), the
|
|
// function works recursively, using the depthfirst method.
|
|
function NodeByAttributeValue(const NodeName, AttribName, AttribValue: UTF8String;
|
|
ShouldRecurse: boolean = True): TXmlNode;
|
|
// Return a pointer to the first subnode with this Elementype, or return nil
|
|
// if no subnode with that type is found.
|
|
function NodeByElementType(ElementType: TXmlElementType): TXmlNode;
|
|
// Return a pointer to the first subnode in the nodelist that has name AName.
|
|
// If no subnodes with AName are found, the function returns nil.
|
|
function NodeByName(const AName: UTF8String): TXmlNode; virtual;
|
|
// \Delete the subnode at Index. The node will also be freed, so do not free the
|
|
// node in the application.
|
|
procedure NodeDelete(Index: integer); virtual;
|
|
// Switch position of the nodes at Index1 and Index2.
|
|
procedure NodeExchange(Index1, Index2: integer);
|
|
// Extract the node ANode from the subnode list. The node will no longer appear
|
|
// in the subnodes list, so the application is responsible for freeing ANode later.
|
|
function NodeExtract(ANode: TXmlNode): TXmlNode; virtual;
|
|
// This function returns a pointer to the first node with AName. If this node
|
|
// is not found, then it creates a new node with AName and returns its pointer.
|
|
function NodeFindOrCreate(const AName: UTF8String): TXmlNode; virtual;
|
|
// Find the index of the first subnode with name AName.
|
|
function NodeIndexByName(const AName: UTF8String): integer; virtual;
|
|
// Find the index of the first subnode with name AName that appears after or on
|
|
// the index AFrom. This function can be used in a loop to retrieve all nodes
|
|
// with a certain name, without using a helper list. See also NodesByName.
|
|
function NodeIndexByNameFrom(const AName: UTF8String; AFrom: integer): integer; virtual;
|
|
// Call NodeIndexOf to get the index for ANode in the Nodes array. The first
|
|
// node in the array has index 0, the second item has index 1, and so on. If
|
|
// a node is not in the list, NodeIndexOf returns -1.
|
|
function NodeIndexOf(ANode: TXmlNode): integer;
|
|
// Insert the node ANode at location Index in the list.
|
|
procedure NodeInsert(Index: integer; ANode: TXmlNode); virtual;
|
|
// \Create a new node with AName, add it to the subnode list, and return a
|
|
// pointer to it.
|
|
function NodeNew(const AName: UTF8String): TXmlNode; virtual;
|
|
// \Create a new node with AName, and insert it into the subnode list at location
|
|
// Index, and return a pointer to it.
|
|
function NodeNewAtIndex(Index: integer; const AName: UTF8String): TXmlNode; virtual;
|
|
// Call NodeRemove to remove a specific node from the Nodes array when its index
|
|
// is unknown. The value returned is the index of the item in the Nodes array
|
|
// before it was removed. After an item is removed, all the items that follow
|
|
// it are moved up in index position and the NodeCount is reduced by one.
|
|
function NodeRemove(ANode: TxmlNode): integer;
|
|
// \Clear (and free) the complete list of subnodes.
|
|
procedure NodesClear; virtual;
|
|
// Use this procedure to retrieve all nodes that have name AName. Pointers to
|
|
// these nodes are added to the list in AList. AList must be initialized
|
|
// before calling this procedure. If you use a TXmlNodeList you don't need
|
|
// to cast the list items to TXmlNode.
|
|
procedure NodesByName(const AName: UTF8String; const AList: TList);
|
|
// Find the attribute with AName, and convert its value to a boolean. If the
|
|
// attribute is not found, or cannot be converted, the default ADefault will
|
|
// be returned.
|
|
function ReadAttributeBool(const AName: UTF8String; ADefault: boolean = False): boolean; virtual;
|
|
function ReadAttributeDateTime(const AName: UTF8String; ADefault: TDateTime = 0): TDateTime; virtual;
|
|
// Find the attribute with AName, and convert its value to an integer. If the
|
|
// attribute is not found, or cannot be converted, the default ADefault will
|
|
// be returned.
|
|
function ReadAttributeInteger(const AName: UTF8String; ADefault: integer = 0): integer; virtual;
|
|
// Find the attribute with AName, and convert its value to an int64. If the
|
|
// attribute is not found, or cannot be converted, the default ADefault will
|
|
// be returned.
|
|
function ReadAttributeInt64(const AName: UTF8String; ADefault: int64 = 0): int64; virtual;
|
|
// Find the attribute with AName, and convert its value to a float. If the
|
|
// attribute is not found, or cannot be converted, the default ADefault will
|
|
// be returned.
|
|
function ReadAttributeFloat(const AName: UTF8String; ADefault: double = 0): double;
|
|
function ReadAttributeString(const AName: UTF8String; const ADefault: UTF8String = ''): UTF8String; virtual;
|
|
// Read the subnode with AName and convert it to a boolean value. If the
|
|
// subnode is not found, or cannot be converted, the boolean ADefault will
|
|
// be returned.
|
|
function ReadBool(const AName: UTF8String; ADefault: boolean = False): boolean; virtual;
|
|
{$IFDEF USEGRAPHICS}
|
|
// Read the properties Color and Style for the TBrush object ABrush from the
|
|
// subnode with AName.
|
|
procedure ReadBrush(const AName: UTF8String; ABrush: TBrush); virtual;
|
|
// Read the subnode with AName and convert its value to TColor. If the
|
|
// subnode is not found, or cannot be converted, ADefault will be returned.
|
|
function ReadColor(const AName: UTF8String; ADefault: TColor = clBlack): TColor; virtual;
|
|
// Read the properties \Name, Color, Size and Style for the TFont object AFont
|
|
// from the subnode with AName.
|
|
procedure ReadFont(const AName: UTF8String; AFont: TFont); virtual;
|
|
// Read the properties Color, Mode, Style and Width for the TPen object APen
|
|
// from the subnode with AName.
|
|
procedure ReadPen(const AName: UTF8String; APen: TPen); virtual;
|
|
{$ENDIF}
|
|
// Read the subnode with AName and convert its value to TDateTime. If the
|
|
// subnode is not found, or cannot be converted, ADefault will be returned.
|
|
function ReadDateTime(const AName: UTF8String; ADefault: TDateTime = 0): TDateTime; virtual;
|
|
// Read the subnode with AName and convert its value to a double. If the
|
|
// subnode is not found, or cannot be converted, ADefault will be returned.
|
|
function ReadFloat(const AName: UTF8String; ADefault: double = 0.0): double; virtual;
|
|
// Read the subnode with AName and convert its value to an int64. If the
|
|
// subnode is not found, or cannot be converted, ADefault will be returned.
|
|
function ReadInt64(const AName: UTF8String; ADefault: int64 = 0): int64; virtual;
|
|
// Read the subnode with AName and convert its value to an integer. If the
|
|
// subnode is not found, or cannot be converted, ADefault will be returned.
|
|
function ReadInteger(const AName: UTF8String; ADefault: integer = 0): integer; virtual;
|
|
// Read the subnode with AName and return its UTF8String value. If the subnode is
|
|
// not found, ADefault will be returned.
|
|
function ReadString(const AName: UTF8String; const ADefault: UTF8String = ''): UTF8String; virtual;
|
|
// Read the subnode with AName and return its UnicodeString value. If the subnode is
|
|
// not found, ADefault will be returned.
|
|
function ReadUnicodeString(const AName: UTF8String; const ADefault: UnicodeString = ''): UnicodeString; virtual;
|
|
// Sort the child nodes of this node. Provide a custom node compare function in Compare,
|
|
// or attach an event handler to the parent documents' OnNodeCompare in order to
|
|
// provide custom sorting. If no compare function is given (nil) and OnNodeCompare
|
|
// is not implemented, SortChildNodes will simply sort the nodes by name (ascending,
|
|
// case insensitive). The Info pointer parameter can be used to pass any custom
|
|
// information to the compare function. Default value for Info is nil.
|
|
procedure SortChildNodes(Compare: TXMLNodeCompareFunction = nil; Info: TPointer = nil);
|
|
// Use ToUnicodeString to convert any UTF8 String from the node (name, value, attributes)
|
|
// to a UnicodeString.
|
|
function ToUnicodeString(const s: UTF8String): UnicodeString;
|
|
// Convert the node's value to boolean and return the result. If this conversion
|
|
// fails, or no value is found, then the function returns ADefault.
|
|
function ValueAsBoolDef(ADefault: boolean): boolean; virtual;
|
|
// Convert the node's value to a TDateTime and return the result. If this conversion
|
|
// fails, or no value is found, then the function returns ADefault.
|
|
function ValueAsDateTimeDef(ADefault: TDateTime): TDateTime; virtual;
|
|
// Convert the node's value to a double and return the result. If this conversion
|
|
// fails, or no value is found, then the function returns ADefault.
|
|
function ValueAsFloatDef(ADefault: double): double; virtual;
|
|
// Convert the node's value to int64 and return the result. If this conversion
|
|
// fails, or no value is found, then the function returns ADefault.
|
|
function ValueAsInt64Def(ADefault: int64): int64; virtual;
|
|
// Convert the node's value to integer and return the result. If this conversion
|
|
// fails, or no value is found, then the function returns ADefault.
|
|
function ValueAsIntegerDef(ADefault: integer): integer; virtual;
|
|
// If the attribute with name AName exists, then set its value to the boolean
|
|
// AValue. If it does not exist, then create a new attribute AName with the
|
|
// boolean value converted to either "True" or "False". If ADefault = AValue, and
|
|
// WriteOnDefault = False, no attribute will be added.
|
|
procedure WriteAttributeBool(const AName: UTF8String; AValue: boolean; ADefault: boolean = False); virtual;
|
|
procedure WriteAttributeDateTime(const AName: UTF8string; AValue: TDateTime; ADefault: TDateTime = 0); virtual;
|
|
// If the attribute with name AName exists, then set its value to the integer
|
|
// AValue. If it does not exist, then create a new attribute AName with the
|
|
// integer value converted to a quoted string. If ADefault = AValue, and
|
|
// WriteOnDefault = False, no attribute will be added.
|
|
procedure WriteAttributeInteger(const AName: UTF8String; AValue: integer; ADefault: integer = 0); virtual;
|
|
procedure WriteAttributeInt64(const AName: UTF8String; const AValue: int64; ADefault: int64 = 0); virtual;
|
|
procedure WriteAttributeFloat(const AName: UTF8String; AValue: double; ADefault: double = 0); virtual;
|
|
// If the attribute with name AName exists, then set its value to the UTF8String
|
|
// AValue. If it does not exist, then create a new attribute AName with the
|
|
// value AValue. If ADefault = AValue, and WriteOnDefault = False, no attribute
|
|
// will be added.
|
|
procedure WriteAttributeString(const AName: UTF8String; const AValue: UTF8String; const ADefault: UTF8String = ''); virtual;
|
|
// Add or replace the subnode with AName and set its value to represent the boolean
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
procedure WriteBool(const AName: UTF8String; AValue: boolean; ADefault: boolean = False); virtual;
|
|
{$IFDEF USEGRAPHICS}
|
|
// Write properties Color and Style of the TBrush object ABrush to the subnode
|
|
// with AName. If AName does not exist, it will be created.
|
|
procedure WriteBrush(const AName: UTF8String; ABrush: TBrush); virtual;
|
|
// Add or replace the subnode with AName and set its value to represent the TColor
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
procedure WriteColor(const AName: UTF8String; AValue: TColor; ADefault: TColor = clBlack); virtual;
|
|
// Write properties \Name, Color, Size and Style of the TFont object AFont to
|
|
// the subnode with AName. If AName does not exist, it will be created.
|
|
procedure WriteFont(const AName: UTF8String; AFont: TFont); virtual;
|
|
// Write properties Color, Mode, Style and Width of the TPen object APen to
|
|
// the subnode with AName. If AName does not exist, it will be created.
|
|
procedure WritePen(const AName: UTF8String; APen: TPen); virtual;
|
|
{$ENDIF}
|
|
// Add or replace the subnode with AName and set its value to represent the TDateTime
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
// The XML format used is compliant with W3C's specification of date and time.
|
|
procedure WriteDateTime(const AName: UTF8String; AValue: TDateTime; ADefault: TDateTime = 0); virtual;
|
|
// Add or replace the subnode with AName and set its value to represent the double
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
procedure WriteFloat(const AName: UTF8String; AValue: double; ADefault: double = 0.0); virtual;
|
|
// Add or replace the subnode with AName and set its value to represent the hexadecimal representation of
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
procedure WriteHex(const AName: UTF8String; AValue: integer; Digits: integer; ADefault: integer = 0); virtual;
|
|
// Add or replace the subnode with AName and set its value to represent the int64
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
procedure WriteInt64(const AName: UTF8String; AValue: int64; ADefault: int64 = 0); virtual;
|
|
// Add or replace the subnode with AName and set its value to represent the integer
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
procedure WriteInteger(const AName: UTF8String; AValue: integer; ADefault: integer = 0); virtual;
|
|
// Add or replace the subnode with AName and set its value to represent the UTF8String
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
procedure WriteString(const AName, AValue: UTF8String; const ADefault: UTF8String = ''); virtual;
|
|
// Call WriteToString to save the XML node to a UTF8String. This method can be used to store
|
|
// individual nodes instead of the complete XML document.
|
|
function WriteToString: UTF8String; virtual;
|
|
// Add or replace the subnode with AName and set its value to represent the UnicodeString
|
|
// AValue. If AValue = ADefault, and WriteOnDefault = False, no subnode will be added.
|
|
procedure WriteUnicodeString(const AName: UTF8String; const AValue: UnicodeString; const ADefault: UnicodeString = ''); virtual;
|
|
// AttributeByName returns the attribute value for the attribute that has name AName.
|
|
// Set AttributeByName to add an attribute to the attribute list, or replace an
|
|
// existing one.
|
|
property AttributeByName[const AName: UTF8String]: UTF8String read GetAttributeByName write
|
|
SetAttributeByName;
|
|
// AttributeByNameWide returns the attribute value for the attribute that has name AName
|
|
// as UnicodeString. Set AttributeByNameWide to add an attribute to the attribute list, or replace an
|
|
// existing one.
|
|
property AttributeByNameWide[const AName: UTF8String]: UnicodeString read GetAttributeByNameWide write
|
|
SetAttributeByNameWide;
|
|
// Returns the number of attributes in the current node.
|
|
property AttributeCount: integer read GetAttributeCount;
|
|
// Read this property to get the name of the attribute at Index. Note that Index
|
|
// is zero-based: Index goes from 0 to AttributeCount - 1
|
|
property AttributeName[Index: integer]: UTF8String read GetAttributeName write SetAttributeName;
|
|
// Read this property to get the Attribute \Name and Value pair at index Index.
|
|
// This is a UTF8String with \Name and Value separated by a TAB character (#9).
|
|
property AttributePair[Index: integer]: UTF8String read GetAttributePair;
|
|
// Read this property to get the UTF8String value of the attribute at index Index.
|
|
// Write to it to set the UTF8String value.
|
|
property AttributeValue[Index: integer]: UTF8String read GetAttributeValue write SetAttributeValue;
|
|
// Read this property to get the UnicodeString value of the attribute at index Index.
|
|
// Write to it to set the UnicodeString value.
|
|
property AttributeValueAsUnicodeString[Index: integer]: UnicodeString read GetAttributeValueAsUnicodeString write SetAttributeValueAsUnicodeString;
|
|
// Read this property to get the integer value of the attribute at index Index.
|
|
// If the value cannot be converted, 0 will be returned. Write to it to set the integer value.
|
|
property AttributeValueAsInteger[Index: integer]: integer read GetAttributeValueAsInteger write SetAttributeValueAsInteger;
|
|
// Set or get the raw attribute value, thus circumventing the escape function. Make sure that
|
|
// the value you set does not contain the & and quote AnsiCharacters, or the produced
|
|
// XML will be invalid.
|
|
property AttributeValueDirect[Index: integer]: UTF8String read GetAttributeValueDirect write SetAttributeValueDirect;
|
|
// BinaryEncoding reflects the same value as the BinaryEncoding setting of the parent
|
|
// Document.
|
|
property BinaryEncoding: TBinaryEncodingType read GetBinaryEncoding write SetBinaryEncoding;
|
|
// Use BinaryString to add/extract binary data in an easy way to/from the node. Internally the
|
|
// data gets stored as Base64-encoded data. Do not use this method for normal textual
|
|
// information, it is better to use ValueAsString in that case (adds less overhead).
|
|
property BinaryString: RawByteString read GetBinaryString write SetBinaryString;
|
|
// This property returns the name and index and all predecessors with underscores
|
|
// to separate, in order to get a unique reference that can be used in filenames.
|
|
property CascadedName: UTF8String read GetCascadedName;
|
|
// Pointer to parent NativeXml document, or Nil if none.
|
|
property Document: TNativeXml read FDocument write FDocument;
|
|
// ElementType contains the type of element that this node holds.
|
|
property ElementType: TXmlElementType read FElementType write FElementType;
|
|
// Fullpath will return the complete path of the node from the root, e.g.
|
|
// /Root/SubNode1/SubNode2/ThisNode
|
|
property FullPath: UTF8String read GetFullPath;
|
|
// Read Name to get the name of the element, and write Name to set the name.
|
|
// This is the full name and may include a namespace. (Namespace:Name)
|
|
property Name: UTF8String read FName write SetName;
|
|
// Parent points to the parent node of the current XML node.
|
|
property Parent: TXmlNode read FParent write FParent;
|
|
// NodeCount is the number of child nodes that this node holds. In order to
|
|
// loop through all child nodes, use a construct like this:
|
|
// <CODE>
|
|
// with MyNode do
|
|
// for i := 0 to NodeCount - 1 do
|
|
// with Nodes[i] do
|
|
// ..processing here
|
|
// </CODE>
|
|
property NodeCount: integer read GetNodeCount;
|
|
// Use Nodes to access the child nodes of the current XML node by index. Note
|
|
// that the list is zero-based, so Index is valid from 0 to NodeCount - 1.
|
|
property Nodes[Index: integer]: TXmlNode read GetNodes; default;
|
|
// Tag is an integer value the developer can use in any way. Tag does not get
|
|
// saved to the XML. Tag is often used to point to a GUI element (and is then
|
|
// cast to a pointer).
|
|
property Tag: integer read FTag write FTag;
|
|
// TotalNodeCount represents the total number of child nodes, and child nodes
|
|
// of child nodes etcetera of this particular node. Use the following to get
|
|
// the total number of nodes in the XML document:
|
|
// <CODE>
|
|
// Total := MyDoc.RootNodes.TotalNodeCount;
|
|
// </CODE>
|
|
property TotalNodeCount: integer read GetTotalNodeCount;
|
|
// Read TreeDepth to find out many nested levels there are for the current XML
|
|
// node. Root has a TreeDepth of zero.
|
|
property TreeDepth: integer read GetTreeDepth;
|
|
// ValueAsBool returns the node's value as boolean, or raises an
|
|
// exception if the value cannot be converted to boolean. Set ValueAsBool
|
|
// to convert a boolean to a UTF8String in the node's value field. See also
|
|
// function ValueAsBoolDef.
|
|
property ValueAsBool: boolean read GetValueAsBool write SetValueAsBool;
|
|
// ValueAsDateTime returns the node's value as TDateTime, or raises an
|
|
// exception if the value cannot be converted to TDateTime. Set ValueAsDateTime
|
|
// to convert a TDateTime to a UTF8String in the node's value field. See also
|
|
// function ValueAsDateTimeDef.
|
|
property ValueAsDateTime: TDateTime read GetValueAsDateTime write SetValueAsDateTime;
|
|
// ValueAsIn64 returns the node's value as int64, or raises an
|
|
// exception if the value cannot be converted to int64. Set ValueAsInt64
|
|
// to convert an int64 to a UTF8String in the node's value field. See also
|
|
// function ValueAsInt64Def.
|
|
property ValueAsInt64: int64 read GetValueAsInt64 write SetValueAsInt64;
|
|
// ValueAsInteger returns the node's value as integer, or raises an
|
|
// exception if the value cannot be converted to integer. Set ValueAsInteger
|
|
// to convert an integer to a UTF8String in the node's value field. See also
|
|
// function ValueAsIntegerDef.
|
|
property ValueAsInteger: integer read GetValueAsInteger write SetValueAsInteger;
|
|
// ValueAsFloat returns the node's value as float, or raises an
|
|
// exception if the value cannot be converted to float. Set ValueAsFloat
|
|
// to convert a float to a UTF8String in the node's value field. See also
|
|
// function ValueAsFloatDef.
|
|
property ValueAsFloat: double read GetValueAsFloat write SetValueAsFloat;
|
|
// ValueAsString returns the unescaped version of ValueDirect. All neccesary
|
|
// characters in ValueDirect must be escaped (e.g. "&" becomes "&") but
|
|
// ValueAsString returns them in original format. Always use ValueAsString to
|
|
// set the text value of a node, to make sure all neccesary charaters are
|
|
// escaped.
|
|
property ValueAsString: UTF8String read GetValueAsString write SetValueAsString;
|
|
// ValueAsUnicodeString returns the unescaped version of ValueDirect as a UnicodeString.
|
|
// Always use ValueAsUnicodeString to set the text value of a node, to make sure all
|
|
// neccesary charaters are escaped.
|
|
property ValueAsUnicodeString: UnicodeString read GetValueAsUnicodeString write SetValueAsUnicodeString;
|
|
// ValueDirect is the exact text value as was parsed from the stream. If multiple
|
|
// text elements are encountered, they are added to ValueDirect with a CR to
|
|
// separate them.
|
|
property ValueDirect: UTF8String read FValue write FValue;
|
|
// WriteOnDefault reflects the same value as the WriteOnDefault setting of the parent
|
|
// Document.
|
|
property WriteOnDefault: boolean read GetWriteOnDefault;
|
|
end;
|
|
|
|
// TXmlNodeList is a utility TList descendant that can be used to work with selection
|
|
// lists. An example:
|
|
// <code>
|
|
// procedure FindAllZips(ANode: TXmlNode);
|
|
// var
|
|
// i: integer;
|
|
// AList: TXmlNodeList;
|
|
// begin
|
|
// AList := TXmlNodeList.Create;
|
|
// try
|
|
// // Get a list of all nodes named 'ZIP'
|
|
// ANode.NodesByName('ZIP', AList);
|
|
// for i := 0 to AList.Count - 1 do
|
|
// // Write the value of the node to output. Since AList[i] will be
|
|
// // of type TXmlNode, we can directly access the Value property.
|
|
// WriteLn(AList[i].Value);
|
|
// finally
|
|
// AList.Free;
|
|
// end;
|
|
// end;
|
|
// </code>
|
|
TXmlNodeList = class(TList)
|
|
private
|
|
function GetItems(Index: Integer): TXmlNode;
|
|
procedure SetItems(Index: Integer; const Value: TXmlNode);
|
|
public
|
|
// Return the first node in the list that has an attribute with AName, AValue
|
|
function ByAttribute(const AName, AValue: UTF8String): TXmlNode;
|
|
property Items[Index: Integer]: TXmlNode read GetItems write SetItems; default;
|
|
end;
|
|
|
|
// TNativeXml is the XML document holder. Create a TNativeXml and then use
|
|
// methods LoadFromFile, LoadFromStream or ReadFromString to load an XML document
|
|
// into memory. Or start from scratch and use Root.NodeNew to add nodes and
|
|
// eventually SaveToFile and SaveToStream to save the results as an XML document.
|
|
// Use property Xmlformat = xfReadable to ensure that indented (readable) output
|
|
// is produced.
|
|
TNativeXml = class(TPersistent)
|
|
private
|
|
FAbortParsing: boolean; // Signal to abort the parsing process
|
|
FBinaryEncoding: TBinaryEncodingType; // xbeBinHex or xbeBase64
|
|
FCodecStream: TsdCodecStream; // Temporary stream used to read encoded files
|
|
FDropCommentsOnParse: boolean; // If true, comments are dropped (deleted) when parsing
|
|
FExternalEncoding: TStringEncodingType;
|
|
FFloatAllowScientific: boolean;
|
|
FFloatSignificantDigits: integer;
|
|
FParserWarnings: boolean; // Show parser warnings for non-critical errors
|
|
FRootNodes: TXmlNode; // Root nodes in the document (which contains one normal element that is the root)
|
|
FIndentString: UTF8String; // The indent string used to indent content (default is two spaces)
|
|
FUseFullNodes: boolean; // If true, nodes are never written in short notation.
|
|
FUseLocalBias: Boolean; // If true, datetime values are written with timezone offset and converted to local time when read
|
|
FWriteOnDefault: boolean; // Set this option to "False" to only write values <> default value (default = true)
|
|
FXmlFormat: TXmlFormatType; // xfReadable, xfCompact
|
|
FOnNodeCompare: TXmlNodeCompareEvent; // Compare two nodes
|
|
FOnNodeNew: TXmlNodeEvent; // Called after a node is added
|
|
FOnNodeLoaded: TXmlNodeEvent; // Called after a node is loaded completely
|
|
FOnProgress: TXmlProgressEvent; // Called after a node is loaded/saved, with the current position in the file
|
|
FOnUnicodeLoss: TNotifyEvent; // This event is called when there is a warning for unicode conversion loss when reading unicode
|
|
procedure DoNodeNew(Node: TXmlNode);
|
|
procedure DoNodeLoaded(Node: TXmlNode);
|
|
procedure DoUnicodeLoss(Sender: TObject);
|
|
function GetCommentString: UTF8String;
|
|
procedure SetCommentString(const Value: UTF8String);
|
|
function GetEntityByName(AName: UTF8String): UTF8String;
|
|
function GetRoot: TXmlNode;
|
|
function GetEncodingString: UTF8String;
|
|
procedure SetEncodingString(const Value: UTF8String);
|
|
function GetVersionString: UTF8String;
|
|
procedure SetVersionString(const Value: UTF8String);
|
|
function GetStyleSheetNode: TXmlNode;
|
|
function GetUtf8Encoded: boolean;
|
|
protected
|
|
procedure CopyFrom(Source: TNativeXml); virtual;
|
|
procedure DoProgress(Size: integer);
|
|
function LineFeed: UTF8String; virtual;
|
|
procedure ParseDTD(ANode: TXmlNode; S: TStream); virtual;
|
|
procedure ReadFromStream(S: TStream); virtual;
|
|
procedure WriteToStream(S: TStream); virtual;
|
|
procedure SetDefaults; virtual;
|
|
public
|
|
// Create a new NativeXml document which can then be used to read or write XML files.
|
|
// A document that is created with Create must later be freed using Free.
|
|
// Example:
|
|
// <Code>
|
|
// var
|
|
// ADoc: TNativeXml;
|
|
// begin
|
|
// ADoc := TNativeXml.Create;
|
|
// try
|
|
// ADoc.LoadFromFile('c:\\temp\\myxml.xml');
|
|
// {do something with the document here}
|
|
// finally
|
|
// ADoc.Free;
|
|
// end;
|
|
// end;
|
|
// </Code>
|
|
constructor Create; virtual;
|
|
// Use CreateName to Create a new Xml document that will automatically
|
|
// contain a root element with name ARootName.
|
|
constructor CreateName(const ARootName: UTF8String); virtual;
|
|
// Destroy will free all data in the TNativeXml object. This includes the
|
|
// root node and all subnodes under it. Do not call Destroy directly, call
|
|
// Free instead.
|
|
destructor Destroy; override;
|
|
// When calling Assign with a Source object that is a TNativeXml, will cause
|
|
// it to copy all data from Source.
|
|
procedure Assign(Source: TPersistent); override;
|
|
// Call Clear to remove all data from the object, and restore all defaults.
|
|
procedure Clear; virtual;
|
|
// Function IsEmpty returns true if the root is clear, or in other words, the
|
|
// root contains no value, no name, no subnodes and no attributes.
|
|
function IsEmpty: boolean; virtual;
|
|
// Load an XML document from the TStream object in Stream. The LoadFromStream
|
|
// procedure will raise an exception of type EFilerError when it encounters
|
|
// non-wellformed XML. This method can be used with any TStream descendant.
|
|
// See also LoadFromFile and ReadFromString.
|
|
procedure LoadFromStream(Stream: TStream); virtual;
|
|
// Call procedure LoadFromFile to load an XML document from the filename
|
|
// specified. See Create for an example. The LoadFromFile procedure will raise
|
|
// an exception of type EFilerError when it encounters non-wellformed XML.
|
|
procedure LoadFromFile(const AFileName: string); virtual;
|
|
// Call procedure ReadFromString to load an XML document from the UTF8String AValue.
|
|
// The ReadFromString procedure will raise an exception of type EFilerError
|
|
// when it encounters non-wellformed XML.
|
|
procedure ReadFromString(const AValue: UTF8String); virtual;
|
|
// Call ResolveEntityReferences after the document has been loaded to resolve
|
|
// any present entity references (&Entity;). When an entity is found in the
|
|
// DTD, it will replace the entity reference. Whenever an entity contains
|
|
// XML markup, it will be parsed and become part of the document tree. Since
|
|
// calling ResolveEntityReferences is adding quite some extra overhead, it
|
|
// is not done automatically. If you want to do the entity replacement, a good
|
|
// moment to call ResolveEntityReferences is right after LoadFromFile.
|
|
procedure ResolveEntityReferences;
|
|
// Call SaveToStream to save the XML document to the Stream. Stream
|
|
// can be any TStream descendant. Set XmlFormat to xfReadable if you want
|
|
// the stream to contain indentations to make the XML more human-readable. This
|
|
// is not the default and also not compliant with the XML specification. See
|
|
// SaveToFile for information on how to save in special encoding.
|
|
procedure SaveToStream(Stream: TStream); virtual;
|
|
// Call SaveToFile to save the XML document to a file with FileName. If the
|
|
// filename exists, it will be overwritten without warning. If the file cannot
|
|
// be created, a standard I/O exception will be generated. Set XmlFormat to
|
|
// xfReadable if you want the file to contain indentations to make the XML
|
|
// more human-readable. This is not the default and also not compliant with
|
|
// the XML specification.<p>
|
|
// Saving to special encoding types can be achieved by setting two properties
|
|
// before saving:
|
|
// * ExternalEncoding
|
|
// * EncodingString
|
|
// ExternalEncoding can be se8bit (for plain ascii), seUtf8 (UTF-8), seUtf16LE
|
|
// (for unicode) or seUtf16BE (unicode big endian).<p> Do not forget to also
|
|
// set the EncodingString (e.g. "UTF-8" or "UTF-16") which matches with your
|
|
// ExternalEncoding.
|
|
procedure SaveToFile(const AFileName: string); virtual;
|
|
// Call WriteToString to save the XML document to a UTF8String. Set XmlFormat to
|
|
// xfReadable if you want the UTF8String to contain indentations to make the XML
|
|
// more human-readable. This is not the default and also not compliant with
|
|
// the XML specification.
|
|
function WriteToString: UTF8String; virtual;
|
|
// Set AbortParsing to True if you use the OnNodeNew and OnNodeLoaded events in
|
|
// a SAX-like manner, and you want to abort the parsing process halfway. Example:
|
|
// <code>
|
|
// procedure MyForm.NativeXmlNodeLoaded(Sender: TObject; Node: TXmlNode);
|
|
// begin
|
|
// if (Node.Name = 'LastNode') and (Sender is TNativeXml) then
|
|
// TNativeXml(Sender).AbortParsing := True;
|
|
// end;
|
|
// </code>
|
|
property AbortParsing: boolean read FAbortParsing write FAbortParsing;
|
|
// Choose what kind of binary encoding will be used when calling TXmlNode.BufferRead
|
|
// and TXmlNode.BufferWrite. Default value is xbeBase64.
|
|
property BinaryEncoding: TBinaryEncodingType read FBinaryEncoding write FBinaryEncoding;
|
|
// A comment string above the root element \<!--{comment}--\> can be accessed with
|
|
// this property. \Assign a comment to this property to add it to the XML document.
|
|
// Use property RootNodeList to add/insert/extract multiple comments.
|
|
property CommentString: UTF8String read GetCommentString write SetCommentString;
|
|
// Set DropCommentsOnParse if you're not interested in any comment nodes in your object
|
|
// model data. All comments encountered during parsing will simply be skipped and
|
|
// not added as a node with ElementType = xeComment (which is default). Note that
|
|
// when you set this option, you cannot later reconstruct an XML file with the comments
|
|
// back in place.
|
|
property DropCommentsOnParse: boolean read FDropCommentsOnParse write FDropCommentsOnParse;
|
|
// Encoding string (e.g. "UTF-8" or "UTF-16"). This encoding string is stored in
|
|
// the header.
|
|
// Example: In order to get this header:
|
|
// <?xml version="1.0" encoding="UTF-16" ?>
|
|
// enter this code:
|
|
// <CODE>MyXmlDocument.EncodingString := 'UTF-16';</CODE>
|
|
// When reading a file, EncodingString will contain the encoding used.
|
|
property EncodingString: UTF8String read GetEncodingString write SetEncodingString;
|
|
// Returns the value of the named entity in Name, where name should be stripped
|
|
// of the leading & and trailing ;. These entity values are parsed from the
|
|
// Doctype declaration (if any).
|
|
property EntityByName[AName: UTF8String]: UTF8String read GetEntityByName;
|
|
// ExternalEncoding defines in which format XML files are saved. Set ExternalEncoding
|
|
// to se8bit to save as plain text files, to seUtf8 to save as UTF8 files (with
|
|
// Byte Order Mark #EF BB FF) and to seUTF16LE to save as unicode (Byte Order
|
|
// Mark #FF FE). When reading an XML file, the value of ExternalEncoding will
|
|
// be set according to the byte order mark and/or encoding declaration found.
|
|
property ExternalEncoding: TStringEncodingType read FExternalEncoding write FExternalEncoding;
|
|
// When converting floating point values to strings (e.g. in WriteFloat),
|
|
// NativeXml will allow to output scientific notation in some cases, if the
|
|
// result is significantly shorter than normal output, but only if the value
|
|
// of FloatAllowScientific is True (default).
|
|
property FloatAllowScientific: boolean read FFloatAllowScientific write FFloatAllowScientific;
|
|
// When converting floating point values to strings (e.g. in WriteFloat),
|
|
// NativeXml will use this number of significant digits. The default is
|
|
// cDefaultFloatSignificantDigits, and set to 6.
|
|
property FloatSignificantDigits: integer read FFloatSignificantDigits write FFloatSignificantDigits;
|
|
// IndentString is the string used for indentations. By default, it is two
|
|
// spaces: ' '. Set IndentString to something else if you need to have
|
|
// specific indentation, or set it to an empty string to avoid indentation.
|
|
property IndentString: UTF8String read FIndentString write FIndentString;
|
|
// Root is the topmost element in the XML document. Access Root to read any
|
|
// child elements. When creating a new XML document, you can automatically
|
|
// include a Root node, by creating using CreateName.
|
|
property Root: TXmlNode read GetRoot;
|
|
// RootNodeList can be used to directly access the nodes in the root of the
|
|
// XML document. Usually this list consists of one declaration node followed
|
|
// by a normal node which is the Root. You can use this property to add or
|
|
// delete comments, stylesheets, dtd's etc.
|
|
property RootNodeList: TXmlNode read FRootNodes;
|
|
// Get the stylesheet node used for this XML document. If the node does not
|
|
// exist yet, it will be created (thus if you use this property, and don't
|
|
// set any of the attributes, an empty stylesheet node will be the result).
|
|
property StyleSheetNode: TXmlNode read GetStyleSheetNode;
|
|
// Set UseFullNodes to True before saving the XML document to ensure that all
|
|
// nodes are represented by <Node>...</Node> instead of the short version
|
|
// <Node/>. UseFullNodes is False by default.
|
|
property UseFullNodes: boolean read FUseFullNodes write FUseFullNodes;
|
|
// Set UseLocalBias to True if you want to consider the local timezone bias
|
|
// when writing and reading datetime values. UseLocalBias is False by default.
|
|
property UseLocalBias: Boolean read FUseLocalBias write FUseLocalBias;
|
|
// This property is here for backwards compat: all strings inside NativeXml
|
|
// are UTF8Strings, the internal encoding is always UTF8.
|
|
property Utf8Encoded: boolean read GetUtf8Encoded;
|
|
// After reading, this property contains the XML version (usually "1.0").
|
|
property VersionString: UTF8String read GetVersionString write SetVersionString;
|
|
// Set WriteOnDefault to False if you do not want to write default values to
|
|
// the XML document. This option can avoid creating huge documents with
|
|
// redundant info, and will speed up writing.
|
|
property WriteOnDefault: boolean read FWriteOnDefault write FWriteOnDefault;
|
|
// XmlFormat by default is set to xfCompact. This setting is compliant to the spec,
|
|
// and NativeXml will only generate XML files with #$0A as control AnsiCharacter.
|
|
// By setting XmlFormat to xfReadable, you can generate easily readable XML
|
|
// files that contain indentation and carriage returns after each element.
|
|
property XmlFormat: TXmlFormatType read FXmlFormat write FXmlFormat;
|
|
// ParserWarnings by default is True. If True, the parser will raise an
|
|
// exception in cases where the XML document is not technically valid. If False,
|
|
// the parser will try to ignore non-critical warnings. Set ParserWarnings
|
|
// to False for some types of XML-based documents such as SOAP messages.
|
|
property ParserWarnings: boolean read FParserWarnings write FParserWarnings;
|
|
// This event is called whenever a node's SortChildNodes method is called and
|
|
// no direct compare method is provided. Implement this event if you want to
|
|
// use object-event based methods for comparison of nodes.
|
|
property OnNodeCompare: TXmlNodeCompareEvent read FOnNodeCompare write FOnNodeCompare;
|
|
// This event is called whenever the parser has encountered a new node.
|
|
property OnNodeNew: TXmlNodeEvent read FOnNodeNew write FOnNodeNew;
|
|
// This event is called when the parser has finished parsing the node, and
|
|
// has created its complete contents in memory.
|
|
property OnNodeLoaded: TXmlNodeEvent read FOnNodeLoaded write FOnNodeLoaded;
|
|
// OnProgress is called during loading and saving of the XML document. The
|
|
// Size parameter contains the position in the stream. This event can be used
|
|
// to implement a progress indicator during loading and saving. The event is
|
|
// called after each node that is read or written.
|
|
property OnProgress: TXmlProgressEvent read FOnProgress write FOnProgress;
|
|
// This event is called if there is a warning for unicode conversion loss,
|
|
// when reading from Unicode streams or files.
|
|
property OnUnicodeLoss: TNotifyEvent read FOnUnicodeLoss write FOnUnicodeLoss;
|
|
end;
|
|
|
|
// This enumeration defines the conversion stream access mode.
|
|
TsdStreamModeType = (
|
|
umUnknown, // The stream access mode is not yet known
|
|
umRead, // UTF stream opened for reading
|
|
umWrite // UTF stream opened for writing
|
|
);
|
|
|
|
// TBigByteArray is an array of bytes like the standard TByteArray (windows
|
|
// unit) but which can contain up to MaxInt bytes. This type helps avoiding
|
|
// range check errors when working with buffers larger than 32768 bytes.
|
|
TBigByteArray = array[0..MaxInt - 1] of byte;
|
|
PBigByteArray = ^TBigByteArray;
|
|
|
|
{$IFDEF CLR}
|
|
|
|
// not implemented
|
|
TsdBufferedStream = class(TStream)
|
|
private
|
|
FStream: TStream;
|
|
FOwned: Boolean;
|
|
protected
|
|
procedure SetSize(NewSize: Int64); override;
|
|
public
|
|
constructor Create(AStream: TStream; Owned: Boolean = False);
|
|
destructor Destroy; override;
|
|
function Read(var Buffer: array of Byte; Offset, Count: Longint): Longint; override;
|
|
function Write(const Buffer: array of Byte; Offset, Count: Longint): Longint; override;
|
|
function Seek(const Offset: Int64; Origin: TSeekOrigin): Int64; override;
|
|
end;
|
|
|
|
TsdBufferedReadStream = TsdBufferedStream;
|
|
|
|
TsdBufferedWriteStream = TsdBufferedStream;
|
|
|
|
{$ELSE}
|
|
|
|
// TsdBufferedReadStream is a buffered stream that takes another TStream
|
|
// and reads only buffer-wise from it, and reads to the stream are first
|
|
// done from the buffer. This stream type can only support reading.
|
|
TsdBufferedReadStream = class(TStream)
|
|
private
|
|
FStream: TStream;
|
|
FBuffer: PBigByteArray;
|
|
FPage: integer;
|
|
FBufPos: integer;
|
|
FBufSize: integer;
|
|
FPosition: longint;
|
|
FOwned: boolean;
|
|
FMustCheck: boolean;
|
|
protected
|
|
procedure CheckPosition;
|
|
public
|
|
// Create the buffered reader stream by passing the source stream in AStream,
|
|
// this source stream must already be initialized. If Owned is set to True,
|
|
// the source stream will be freed by TsdBufferedReadStream.
|
|
constructor Create(AStream: TStream; Owned: boolean = False);
|
|
destructor Destroy; override;
|
|
function Read(var Buffer; Count: Longint): Longint; override;
|
|
function Write(const Buffer; Count: Longint): Longint; override;
|
|
function Seek(Offset: Longint; Origin: Word): Longint; override;
|
|
end;
|
|
|
|
// TsdBufferedWriteStream is a buffered stream that takes another TStream
|
|
// and writes only buffer-wise to it, and writes to the stream are first
|
|
// done to the buffer. This stream type can only support writing.
|
|
TsdBufferedWriteStream = class(TStream)
|
|
private
|
|
FStream: TStream;
|
|
FBuffer: PBigByteArray;
|
|
FBufPos: integer;
|
|
FPosition: longint;
|
|
FOwned: boolean;
|
|
protected
|
|
procedure Flush;
|
|
public
|
|
// Create the buffered writer stream by passing the destination stream in AStream,
|
|
// this destination stream must already be initialized. If Owned is set to True,
|
|
// the destination stream will be freed by TsdBufferedWriteStream.
|
|
constructor Create(AStream: TStream; Owned: boolean = False);
|
|
destructor Destroy; override;
|
|
function Read(var Buffer; Count: Longint): Longint; override;
|
|
function Write(const Buffer; Count: Longint): Longint; override;
|
|
function Seek(Offset: Longint; Origin: Word): Longint; override;
|
|
end;
|
|
|
|
{$ENDIF}
|
|
|
|
// TsdCodecStream is the base codec class for reading and writing encoded files.
|
|
// See TsdUtf8Stream for more information.
|
|
TsdCodecStream = class(TStream)
|
|
private
|
|
FBuffer: UTF8String; // Buffer that holds temporary utf8 characters
|
|
FBufferPos: integer; // Current character in buffer
|
|
FEncoding: TStringEncodingType; // Type of string encoding used for the external stream
|
|
FMode: TsdStreamModeType; // Access mode of this UTF stream, determined after first read/write
|
|
FPosMin1: integer; // Position for seek(-1)
|
|
FPosMin2: integer; // Position for seek(-2)
|
|
FStream: TStream; // Referenced stream
|
|
FSwapByteOrder: boolean;
|
|
FWarningUnicodeLoss: boolean; // There was a warning for a unicode conversion loss
|
|
FWriteBom: boolean;
|
|
FOnUnicodeLoss: TNotifyEvent; // This event is called if there is a warning for unicode conversion loss
|
|
protected
|
|
function ReadByte: byte; virtual;
|
|
procedure StorePrevPositions; virtual;
|
|
procedure WriteByte(const B: byte); virtual;
|
|
procedure WriteBuf(const Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Offset, Count: longint); virtual;
|
|
function InternalRead(var Buffer{$IFDEF CLR}: array of Byte{$ENDIF}; Offset, Count: Longint): Longint;
|
|
function InternalSeek(Offset: Longint; Origin: TSeekOrigin): Longint;
|
|
function InternalWrite(const Buffer{$IFDEF CLR}: array of Byte{$ENDIF}; Offset, Count: Longint): Longint;
|
|
{$IFDEF CLR}
|
|
procedure SetSize(NewSize: Int64); override;
|
|
{$ENDIF}
|
|
public
|
|
// Call Create to create a new TsdCodectream based on an input or output stream
|
|
// in AStream. After the first Read, the input streamtype will be determined,
|
|
// and the Encoding property will be set accordingly. When using Write to
|
|
// write data to the referenced stream, the Encoding property must be set prior
|
|
// to this, indicating what kind of stream to produce.
|
|
constructor Create(AStream: TStream); virtual;
|
|
// Read Count bytes from the referenced stream, and put them in Buffer. The function
|
|
// returns the actual number of bytes read. The codec stream can only read
|
|
// one byte at the time!
|
|
{$IFDEF CLR}
|
|
function Read(var Buffer: array of Byte; Offset, Count: Longint): Longint; override;
|
|
{$ELSE}
|
|
function Read(var Buffer; Count: Longint): Longint; override;
|
|
{$ENDIF}
|
|
// Seek to a new position in the stream, with Origin as a reference. The codec
|
|
// stream can not seek when writing, and when reading can only go back one
|
|
// AnsiCharacter, or return a position. Position returned is the position
|
|
// in the referenced stream.
|
|
{$IFDEF CLR}
|
|
function Seek(const Offset: Int64; Origin: TSeekOrigin): Int64; override;
|
|
{$ELSE}
|
|
function Seek(Offset: Longint; Origin: Word): Longint; override;
|
|
{$ENDIF}
|
|
// Write Count bytes from Buffer to the referenced stream, The function
|
|
// returns the actual number of bytes written.
|
|
{$IFDEF CLR}
|
|
function Write(const Buffer: array of Byte; Offset, Count: Longint): Longint; override;
|
|
{$ELSE}
|
|
function Write(const Buffer; Count: Longint): Longint; override;
|
|
{$ENDIF}
|
|
// Set Encoding when writing to the preferred encoding of the output stream,
|
|
// or read Encoding after reading the output stream to determine encoding type.
|
|
property Encoding: TstringEncodingType read FEncoding write FEncoding;
|
|
// \Read this value after loading an XML file. It will be True if there was a
|
|
// warning for a unicode conversion loss.
|
|
property WarningUnicodeLoss: boolean read FWarningUnicodeLoss;
|
|
// This event is called if there is a warning for unicode conversion loss.
|
|
property OnUnicodeLoss: TNotifyEvent read FOnUnicodeLoss write FOnUnicodeLoss;
|
|
end;
|
|
|
|
// TsdUdf8tream is a conversion stream that will load ANSI, UTF8 or
|
|
// Unicode files and convert them into UTF8 only. The stream can
|
|
// also save UTF8 data as Ansi, UTF8 or Unicode.
|
|
TsdUtf8Stream = class(TsdCodecStream)
|
|
private
|
|
protected
|
|
function ReadByte: byte; override;
|
|
procedure WriteByte(const B: byte); override;
|
|
procedure WriteBuf(const Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Offset, Count: longint); override;
|
|
end;
|
|
|
|
// TsdSurplusReader is a simple class that can store a few surplus characters
|
|
// and returns these first before reading from the underlying stream
|
|
TsdSurplusReader = class
|
|
private
|
|
FStream: TStream;
|
|
FSurplus: UTF8String;
|
|
public
|
|
constructor Create(AStream: TStream);
|
|
property Surplus: UTF8String read FSurplus write FSurplus;
|
|
function ReadChar(var Ch: AnsiChar): integer;
|
|
function ReadCharSkipBlanks(var Ch: AnsiChar): boolean;
|
|
end;
|
|
|
|
// Simple string builder class that allocates string memory more effectively
|
|
// to avoid repeated re-allocation
|
|
TsdStringBuilder = class
|
|
private
|
|
FData: UTF8String;
|
|
FCurrentIdx: integer;
|
|
function GetData(Index: integer): AnsiChar;
|
|
procedure Reallocate(RequiredLength: integer);
|
|
public
|
|
constructor Create;
|
|
procedure Clear;
|
|
procedure AddChar(Ch: AnsiChar);
|
|
procedure AddString(var S: UTF8String);
|
|
function StringCopy(AFirst, ALength: integer): UTF8String;
|
|
function Value: UTF8String;
|
|
property Length: integer read FCurrentIdx;
|
|
property Data[Index: integer]: AnsiChar read GetData; default;
|
|
end;
|
|
|
|
// String functions
|
|
|
|
function sdUTF8StringReplace(const S, OldPattern, NewPattern: UTF8String): UTF8String;
|
|
|
|
// Escape all required characters in string AValue.
|
|
function sdUTF8EscapeString(const AValue: UTF8String): UTF8String;
|
|
|
|
// Replace all escaped characters in string AValue by their original. This includes
|
|
// character references using &#...; and &#x...;
|
|
function sdUTF8UnEscapeString(const AValue: UTF8String): UTF8String;
|
|
|
|
// Enclose the string AValue in quotes.
|
|
function sdUTF8QuotedString(const AValue: UTF8String): UTF8String;
|
|
|
|
// Remove the quotes from string AValue.
|
|
function sdUTF8UnQuotedString(const AValue: UTF8String): UTF8String;
|
|
|
|
// This function adds control characters Chars repeatedly after each Interval
|
|
// of characters to UTF8String Value.
|
|
function sdAddControlChars(const AValue: UTF8String; const Chars: UTF8String; Interval: integer): UTF8String;
|
|
|
|
// This function removes control characters from UTF8String AValue (Tab, CR, LF and Space)
|
|
function sdRemoveControlChars(const AValue: UTF8String): UTF8String;
|
|
|
|
// Convert the UTF8String ADate to a TDateTime according to the W3C date/time specification
|
|
// as found here: http://www.w3.org/TR/NOTE-datetime
|
|
// If there is a conversion error, an exception will be raised.
|
|
function sdDateTimeFromString(const ADate: UTF8String; UseLocalBias: Boolean = False): TDateTime;
|
|
|
|
// Convert the UTF8String ADate to a TDateTime according to the W3C date/time specification
|
|
// as found here: http://www.w3.org/TR/NOTE-datetime
|
|
// If there is a conversion error, the default value ADefault is returned.
|
|
function sdDateTimeFromStringDefault(const ADate: UTF8String; ADefault: TDateTime;
|
|
UseLocalBias: Boolean = False): TDateTime;
|
|
|
|
// Convert the TDateTime ADate to a UTF8String according to the W3C date/time specification
|
|
// as found here: http://www.w3.org/TR/NOTE-datetime
|
|
function sdDateTimeToString(ADate: TDateTime; UseLocalBias: Boolean = False): UTF8String;
|
|
|
|
// Convert a number to a UTF8String, using SignificantDigits to indicate the number of
|
|
// significant digits, and AllowScientific to allow for scientific notation if that
|
|
// results in much shorter notatoin.
|
|
function sdWriteNumber(Value: double; SignificantDigits: integer; AllowScientific: boolean): UTF8String;
|
|
|
|
// Write an UTF8String to the stream
|
|
procedure sdUTF8WriteStringToStream(S: TStream; const AString: UTF8String);
|
|
|
|
// Turn Ch to an UpCase character ('a'..'z' becomes 'A'..'Z')
|
|
function sdUpCase(Ch: AnsiChar): AnsiChar;
|
|
|
|
// Conversion between Ansi, UTF8 and Unicode
|
|
|
|
// Convert a UnicodeString to a UTF8 encoded string
|
|
function sdUnicodeToUtf8(const W: UnicodeString): UTF8String;
|
|
|
|
// Convert a AnsiString to a UTF8 encoded string
|
|
function sdAnsiToUtf8(const S: AnsiString): UTF8String;
|
|
|
|
// Convert a UTF8 encoded string to a UnicodeString
|
|
function sdUtf8ToUnicode(const S: UTF8String): UnicodeString;
|
|
|
|
// Convert a UTF8 encoded string to a AnsiString. This might cause loss!
|
|
function sdUtf8ToAnsi(const S: UTF8String): AnsiString;
|
|
|
|
|
|
// parse functions
|
|
|
|
// Find SubString within UTF8String S, only process characters between Start and Close.
|
|
// First occurrance is reported in APos. If something is found, function returns True.
|
|
function sdUTF8FindString(const SubString, S: UTF8String; Start, Close: integer; var APos: integer): boolean;
|
|
|
|
// Detect if the SubString matches the characters in S from position Start. S may be
|
|
// actually longer than SubString, only length(SubString) characters are checked.
|
|
function sdUTF8MatchString(const SubString: UTF8String; const S: UTF8String; Start: integer): boolean;
|
|
|
|
// Find all Name="Value" pairs in UTF8String AValue (from Start to Close - 1), and put
|
|
// the resulting attributes in stringlist Attributes. This stringlist must already
|
|
// be initialized when calling this function.
|
|
procedure sdUTF8ParseAttributes(const AValue: UTF8String; Start, Close: integer; Attributes: TsdUTF8StringList);
|
|
|
|
// Trim the UTF8String AValue between Start and Close - 1 (remove whitespaces at start
|
|
// and end), not by adapting the UTF8String but by adjusting the Start and Close indices.
|
|
// If the resulting UTF8String still has a length > 0, the function returns True.
|
|
function sdUTF8TrimPos(const AValue: UTF8String; var Start, Close: integer): boolean;
|
|
|
|
// Trim the UTF8String
|
|
function sdUTF8Trim(const AValue: UTF8String): UTF8String;
|
|
|
|
// Encoding/Decoding functions
|
|
|
|
// Encode binary data in Source as BASE64. The function returns the BASE64 encoded
|
|
// data as UTF8String, without any linebreaks.
|
|
function EncodeBase64(const Source: RawByteString): UTF8String;
|
|
|
|
// Decode BASE64 data in Source into binary data. The function returns the binary
|
|
// data as UTF8String. Use a TStringStream to convert this data to a stream. The Source
|
|
// UTF8String may contain linebreaks and control characters, these will be stripped.
|
|
function DecodeBase64(const Source: UTF8String): RawByteString;
|
|
|
|
// Encode binary data in Source as BINHEX. The function returns the BINHEX encoded
|
|
// data as UTF8String, without any linebreaks.
|
|
function EncodeBinHex(const Source: RawByteString): UTF8String;
|
|
|
|
// Decode BINHEX data in Source into binary data. The function returns the binary
|
|
// data as UTF8String. Use a TStringStream to convert this data to a stream. The Source
|
|
// UTF8String may contain linebreaks and control characters, these will be stripped.
|
|
function DecodeBinHex(const Source: UTF8String): RawByteString;
|
|
|
|
resourcestring
|
|
|
|
sxeErrorCalcStreamLength = 'Error while calculating streamlength';
|
|
sxeMissingDataInBinaryStream = 'Missing data in binary stream';
|
|
sxeMissingElementName = 'Missing element name';
|
|
sxeMissingCloseTag = 'Missing close tag in element %s';
|
|
sxeMissingDataAfterGreaterThan = 'Missing data after "<" in element %s';
|
|
sxeMissingLessThanInCloseTag = 'Missing ">" in close tag of element %s';
|
|
sxeIncorrectCloseTag = 'Incorrect close tag in element %s';
|
|
sxeIllegalCharInNodeName = 'Illegal character in node name "%s"';
|
|
sxeMoreThanOneRootElement = 'More than one root element found in xml';
|
|
sxeMoreThanOneDeclaration = 'More than one xml declaration found in xml';
|
|
sxeDeclarationMustBeFirstElem = 'Xml declaration must be first element';
|
|
sxeMoreThanOneDoctype = 'More than one doctype declaration found in root';
|
|
sxeDoctypeAfterRootElement = 'Doctype declaration found after root element';
|
|
sxeNoRootElement = 'No root element found in xml';
|
|
sxeIllegalElementType = 'Illegal element type';
|
|
sxeCDATAInRoot = 'No CDATA allowed in root';
|
|
sxeRootElementNotDefined = 'XML root element not defined.';
|
|
sxeCodecStreamNotAssigned = 'Encoding stream unassigned';
|
|
sxeUnsupportedEncoding = 'Unsupported string encoding';
|
|
sxeCannotReadCodecForWriting = 'Cannot read from a conversion stream opened for writing';
|
|
sxeCannotWriteCodecForReading = 'Cannot write to an UTF stream opened for reading';
|
|
sxeCannotReadMultipeChar = 'Cannot read multiple chars from conversion stream at once';
|
|
sxeCannotPerformSeek = 'Cannot perform seek on codec stream';
|
|
sxeCannotSeekBeforeReadWrite = 'Cannot seek before reading or writing in conversion stream';
|
|
sxeCannotSeek = 'Cannot perform seek in conversion stream';
|
|
sxeCannotWriteToOutputStream = 'Cannot write to output stream';
|
|
sxeXmlNodeNotAssigned = 'XML Node is not assigned';
|
|
sxeCannotConverToBool = 'Cannot convert value to bool';
|
|
sxeCannotConvertToFloat = 'Cannot convert value to float';
|
|
sxeSignificantDigitsOutOfRange = 'Significant digits out of range';
|
|
|
|
implementation
|
|
|
|
type
|
|
|
|
// Internal type
|
|
TTagType = record
|
|
Start: UTF8String;
|
|
Close: UTF8String;
|
|
Style: TXmlElementType;
|
|
end;
|
|
PByte = ^byte;
|
|
|
|
TBomInfo = packed record
|
|
BOM: array[0..3] of byte;
|
|
Len: integer;
|
|
Encoding: TStringEncodingType;
|
|
HasBOM: boolean;
|
|
end;
|
|
|
|
const
|
|
|
|
// Count of different escape characters
|
|
cEscapeCount = 5;
|
|
|
|
// These are characters that must be escaped. Note that "&" is first since
|
|
// when another would be replaced first (eg ">" by "<") this could
|
|
// cause the new "&" in "<" to be replaced by "&";
|
|
cEscapes: array[0..cEscapeCount - 1] of UTF8String =
|
|
('&', '<', '>', '''', '"');
|
|
|
|
// These are the strings that replace the escape strings - in the same order
|
|
cReplaces: array[0..cEscapeCount - 1] of UTF8String =
|
|
('&', '<', '>', ''', '"');
|
|
|
|
cQuoteChars: set of AnsiChar = ['"', ''''];
|
|
cControlChars: set of AnsiChar = [#9, #10, #13, #32]; {Tab, LF, CR, Space}
|
|
|
|
// Count of different XML tags
|
|
cTagCount = 12;
|
|
|
|
cTags: array[0..cTagCount - 1] of TTagType = (
|
|
// The order is important here; the items are searched for in appearing order
|
|
(Start: '<![CDATA['; Close: ']]>'; Style: xeCData),
|
|
(Start: '<!DOCTYPE'; Close: '>'; Style: xeDoctype),
|
|
(Start: '<!ELEMENT'; Close: '>'; Style: xeElement),
|
|
(Start: '<!ATTLIST'; Close: '>'; Style: xeAttList),
|
|
(Start: '<!ENTITY'; Close: '>'; Style: xeEntity),
|
|
(Start: '<!NOTATION'; Close: '>'; Style: xeNotation),
|
|
(Start: '<?xml-stylesheet'; Close: '?>'; Style: xeStylesheet),
|
|
(Start: '<?xml'; Close: '?>'; Style: xeDeclaration),
|
|
(Start: '<!--'; Close: '-->'; Style: xeComment),
|
|
(Start: '<!'; Close: '>'; Style: xeExclam),
|
|
(Start: '<?'; Close: '?>'; Style: xeQuestion),
|
|
(Start: '<'; Close: '>'; Style: xeNormal) );
|
|
// direct tags are derived from Normal tags by checking for the />
|
|
|
|
// These constant are used when generating hexchars from buffer data
|
|
cHexChar: array[0..15] of AnsiChar = '0123456789ABCDEF';
|
|
cHexCharLoCase: array[0..15] of AnsiChar = '0123456789abcdef';
|
|
|
|
// These AnsiCharacters are used when generating BASE64 AnsiChars from buffer data
|
|
cBase64Char: array[0..63] of AnsiChar =
|
|
'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/';
|
|
cBase64PadChar: AnsiChar = '=';
|
|
|
|
// The amount of bytes to allocate with each increase of the value buffer
|
|
cNodeValueBuf = 2048;
|
|
|
|
// byte order marks for strings
|
|
// Unicode text files should contain $FFFE as first character to identify such a file clearly. Depending on the system
|
|
// where the file was created on this appears either in big endian or little endian style.
|
|
|
|
const cBomInfoCount = 15;
|
|
const cBomInfo: array[0..cBomInfoCount - 1] of TBomInfo =
|
|
( (BOM: ($00,$00,$FE,$FF); Len: 4; Encoding: seUCS4BE; HasBOM: true),
|
|
(BOM: ($FF,$FE,$00,$00); Len: 4; Encoding: seUCS4LE; HasBOM: true),
|
|
(BOM: ($00,$00,$FF,$FE); Len: 4; Encoding: seUCS4_2143; HasBOM: true),
|
|
(BOM: ($FE,$FF,$00,$00); Len: 4; Encoding: seUCS4_3412; HasBOM: true),
|
|
(BOM: ($FE,$FF,$00,$00); Len: 2; Encoding: seUTF16BE; HasBOM: true),
|
|
(BOM: ($FF,$FE,$00,$00); Len: 2; Encoding: seUTF16LE; HasBOM: true),
|
|
(BOM: ($EF,$BB,$BF,$00); Len: 3; Encoding: seUTF8; HasBOM: true),
|
|
(BOM: ($00,$00,$00,$3C); Len: 4; Encoding: seUCS4BE; HasBOM: false),
|
|
(BOM: ($3C,$00,$00,$00); Len: 4; Encoding: seUCS4LE; HasBOM: false),
|
|
(BOM: ($00,$00,$3C,$00); Len: 4; Encoding: seUCS4_2143; HasBOM: false),
|
|
(BOM: ($00,$3C,$00,$00); Len: 4; Encoding: seUCS4_3412; HasBOM: false),
|
|
(BOM: ($00,$3C,$00,$3F); Len: 4; Encoding: seUTF16BE; HasBOM: false),
|
|
(BOM: ($3C,$00,$3F,$00); Len: 4; Encoding: seUTF16LE; HasBOM: false),
|
|
(BOM: ($3C,$3F,$78,$6D); Len: 4; Encoding: seAnsi; HasBOM: false),
|
|
(BOM: ($4C,$6F,$A7,$94); Len: 4; Encoding: seEBCDIC; HasBOM: false)
|
|
);
|
|
|
|
// .NET compatible stub for TBytes (array of byte) type
|
|
{$IFNDEF CLR}
|
|
type
|
|
TBytes = TBigByteArray;
|
|
{$ENDIF}
|
|
|
|
function StrScan(const Str: PAnsiChar; Chr: AnsiChar): PAnsiChar;
|
|
begin
|
|
Result := Str;
|
|
while Result^ <> Chr do
|
|
begin
|
|
if Result^ = #0 then
|
|
begin
|
|
Result := nil;
|
|
Exit;
|
|
end;
|
|
Inc(Result);
|
|
end;
|
|
end;
|
|
|
|
function UTF8QuotedStr(const S: UTF8String; Quote: AnsiChar): UTF8String;
|
|
var
|
|
P, Src, Dest: PAnsiChar;
|
|
AddCount: Integer;
|
|
begin
|
|
AddCount := 0;
|
|
P := StrScan(PAnsiChar(S), Quote);
|
|
while P <> nil do
|
|
begin
|
|
Inc(P);
|
|
Inc(AddCount);
|
|
P := StrScan(P, Quote);
|
|
end;
|
|
if AddCount = 0 then
|
|
begin
|
|
Result := UTF8String(Quote) + S + UTF8String(Quote);
|
|
Exit;
|
|
end;
|
|
SetLength(Result, Length(S) + AddCount + 2);
|
|
Dest := Pointer(Result);
|
|
Dest^ := Quote;
|
|
Inc(Dest);
|
|
Src := Pointer(S);
|
|
P := StrScan(Src, Quote);
|
|
repeat
|
|
Inc(P);
|
|
Move(Src^, Dest^, P - Src);
|
|
Inc(Dest, P - Src);
|
|
Dest^ := Quote;
|
|
Inc(Dest);
|
|
Src := P;
|
|
P := StrScan(Src, Quote);
|
|
until P = nil;
|
|
P := StrEnd(Src);
|
|
Move(Src^, Dest^, P - Src);
|
|
Inc(Dest, P - Src);
|
|
Dest^ := Quote;
|
|
end;
|
|
|
|
function UTF8ExtractQuotedStr(const S: UTF8String; Quote: AnsiChar): UTF8String;
|
|
var
|
|
P, Src, Dest: PAnsiChar;
|
|
DropCount: Integer;
|
|
begin
|
|
Result := '';
|
|
Src := PAnsiChar(S);
|
|
if (Src = nil) or (Src^ <> Quote) then
|
|
Exit;
|
|
Inc(Src);
|
|
DropCount := 1;
|
|
P := Src;
|
|
Src := StrScan(Src, Quote);
|
|
while Src <> nil do
|
|
begin
|
|
Inc(Src);
|
|
if Src^ <> Quote then
|
|
Break;
|
|
Inc(Src);
|
|
Inc(DropCount);
|
|
Src := StrScan(Src, Quote);
|
|
end;
|
|
if Src = nil then
|
|
Src := StrEnd(P);
|
|
if ((Src - P) <= 1) then
|
|
Exit;
|
|
if DropCount = 1 then
|
|
SetString(Result, P, Src - P - 1)
|
|
else
|
|
begin
|
|
SetLength(Result, Src - P - DropCount);
|
|
Dest := PAnsiChar(Result);
|
|
Src := StrScan(P, Quote);
|
|
while Src <> nil do
|
|
begin
|
|
Inc(Src);
|
|
if Src^ <> Quote then
|
|
Break;
|
|
Move(P^, Dest^, Src - P);
|
|
Inc(Dest, Src - P);
|
|
Inc(Src);
|
|
P := Src;
|
|
Src := StrScan(Src, Quote);
|
|
end;
|
|
if Src = nil then
|
|
Src := StrEnd(P);
|
|
Move(P^, Dest^, Src - P - 1);
|
|
end;
|
|
end;
|
|
|
|
function Utf8Pos(const Substr, S: UTF8String): Integer;
|
|
var
|
|
i, x: Integer;
|
|
Len, LenSubStr: Integer;
|
|
begin
|
|
i := 1;
|
|
LenSubStr := Length(SubStr);
|
|
Len := Length(S) - LenSubStr + 1;
|
|
while i <= Len do
|
|
begin
|
|
if S[i] = SubStr[1] then
|
|
begin
|
|
x := 1;
|
|
while (x < LenSubStr) and (S[i + x] = SubStr[x + 1]) do
|
|
Inc(x);
|
|
if (x = LenSubStr) then
|
|
begin
|
|
Result := i;
|
|
exit;
|
|
end;
|
|
end;
|
|
Inc(i);
|
|
end;
|
|
Result := 0;
|
|
end;
|
|
|
|
// .NET-compatible TStream.Write
|
|
|
|
function StreamWrite(Stream: TStream; const Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Offset, Count: Longint): Longint;
|
|
begin
|
|
{$IFDEF CLR}
|
|
Result := Stream.Write(Buffer, Offset, Count);
|
|
{$ELSE}
|
|
Result := Stream.Write(TBytes(Buffer)[Offset], Count);
|
|
{$ENDIF}
|
|
end;
|
|
|
|
{$IFNDEF CLR}
|
|
// Delphi's implementation of TStringStream is severely flawed, it does a SetLength
|
|
// on each write, which slows down everything to a crawl. This implementation over-
|
|
// comes this issue.
|
|
type
|
|
TsdUTF8StringStream = class(TMemoryStream)
|
|
public
|
|
constructor Create(const S: UTF8String);
|
|
function DataString: UTF8String;
|
|
end;
|
|
|
|
constructor TsdUTF8StringStream.Create(const S: UTF8String);
|
|
begin
|
|
inherited Create;
|
|
SetSize(length(S));
|
|
if Size > 0 then
|
|
begin
|
|
Write(S[1], Size);
|
|
Position := 0;
|
|
end;
|
|
end;
|
|
|
|
function TsdUTF8StringStream.DataString: UTF8String;
|
|
begin
|
|
SetLength(Result, Size);
|
|
if Size > 0 then
|
|
begin
|
|
Position := 0;
|
|
Read(Result[1], length(Result));
|
|
end;
|
|
end;
|
|
{$ELSE}
|
|
// In .NET we use the standard TStringStream
|
|
type
|
|
TsdUTF8StringStream = TStringStream;
|
|
{$ENDIF}
|
|
|
|
// Utility functions
|
|
|
|
function Min(A, B: integer): integer;
|
|
begin
|
|
if A < B then
|
|
Result := A
|
|
else
|
|
Result := B;
|
|
end;
|
|
|
|
function Max(A, B: integer): integer;
|
|
begin
|
|
if A > B then
|
|
Result := A
|
|
else
|
|
Result := B;
|
|
end;
|
|
|
|
function sdUTF8StringReplace(const S, OldPattern, NewPattern: UTF8String): UTF8String;
|
|
var
|
|
SearchStr, NewStr: UTF8String;
|
|
Offset: Integer;
|
|
begin
|
|
// Case Sensitive, Replace All
|
|
SearchStr := S;
|
|
NewStr := S;
|
|
Result := '';
|
|
while SearchStr <> '' do
|
|
begin
|
|
Offset := UTF8Pos(OldPattern, SearchStr);
|
|
if Offset = 0 then
|
|
begin
|
|
Result := Result + NewStr;
|
|
Break;
|
|
end;
|
|
Result := Result + Copy(NewStr, 1, Offset - 1) + NewPattern;
|
|
NewStr := Copy(NewStr, Offset + Length(OldPattern), MaxInt);
|
|
SearchStr := Copy(SearchStr, Offset + Length(OldPattern), MaxInt);
|
|
end;
|
|
end;
|
|
|
|
function sdUTF8EscapeString(const AValue: UTF8String): UTF8String;
|
|
var
|
|
i: integer;
|
|
begin
|
|
Result := AValue;
|
|
for i := 0 to cEscapeCount - 1 do
|
|
Result := sdUTF8StringReplace(Result, cEscapes[i], cReplaces[i]);
|
|
end;
|
|
|
|
function sdUTF8UnEscapeString(const AValue: UTF8String): UTF8String;
|
|
var
|
|
SearchStr, Reference, Replace: UTF8String;
|
|
i, Offset, Code: Integer;
|
|
W: word;
|
|
begin
|
|
SearchStr := AValue;
|
|
Result := '';
|
|
while SearchStr <> '' do
|
|
begin
|
|
// find '&'
|
|
Offset := Utf8Pos('&', SearchStr);
|
|
if Offset = 0 then
|
|
begin
|
|
// Nothing found
|
|
Result := Result + SearchStr;
|
|
Break;
|
|
end;
|
|
Result := Result + Copy(SearchStr, 1, Offset - 1);
|
|
SearchStr := Copy(SearchStr, Offset, MaxInt);
|
|
// find next ';'
|
|
Offset := Utf8Pos(';', SearchStr);
|
|
if Offset = 0 then
|
|
begin
|
|
// Error: encountered a '&' but not a ';'.. we will ignore, just return
|
|
// the unmodified value
|
|
Result := Result + SearchStr;
|
|
Break;
|
|
end;
|
|
// Reference
|
|
Reference := copy(SearchStr, 1, Offset);
|
|
SearchStr := Copy(SearchStr, Offset + 1, MaxInt);
|
|
Replace := Reference;
|
|
// See if it is a Character reference
|
|
if copy(Reference, 1, 2) = '&#' then
|
|
begin
|
|
Reference := copy(Reference, 3, length(Reference) - 3);
|
|
if length(Reference) > 0 then
|
|
begin
|
|
if sdUpCase(Reference[1]) = 'X' then
|
|
// Hex notation
|
|
Reference[1] := '$';
|
|
Code := StrToIntDef(string(Reference), -1);
|
|
if (Code >= 0) and (Code < $FFFF) then
|
|
begin
|
|
W := Code;
|
|
Replace := sdUnicodeToUtf8(UnicodeChar(W));
|
|
end;
|
|
end;
|
|
end else
|
|
begin
|
|
// Look up default escapes
|
|
for i := 0 to cEscapeCount - 1 do
|
|
if Reference = cReplaces[i] then
|
|
begin
|
|
// Replace
|
|
Replace := cEscapes[i];
|
|
Break;
|
|
end;
|
|
end;
|
|
// New result
|
|
Result := Result + Replace;
|
|
end;
|
|
end;
|
|
|
|
function sdUTF8QuotedString(const AValue: UTF8String): UTF8String;
|
|
var
|
|
Quote: AnsiChar;
|
|
begin
|
|
Quote := '"';
|
|
if UTF8Pos('"', AValue) > 0 then
|
|
Quote := '''';
|
|
{$IFDEF CLR}
|
|
Result := QuotedStr(AValue, AQuoteChar);
|
|
{$ELSE}
|
|
Result := UTF8QuotedStr(AValue, Quote);
|
|
{$ENDIF}
|
|
end;
|
|
|
|
function sdUTF8UnQuotedString(const AValue: UTF8String): UTF8String;
|
|
var
|
|
Quote: AnsiChar;
|
|
begin
|
|
if Length(AValue) < 2 then
|
|
begin
|
|
Result := AValue;
|
|
exit;
|
|
end;
|
|
Quote := AValue[1];
|
|
if Quote in cQuoteChars then
|
|
begin
|
|
{$IFDEF CLR}
|
|
Result := DequotedStr(AValue, Quote);
|
|
{$ELSE}
|
|
Result := UTF8ExtractQuotedStr(AValue, Quote);
|
|
{$ENDIF}
|
|
end else
|
|
Result := AValue;
|
|
end;
|
|
|
|
function sdAddControlChars(const AValue: UTF8String; const Chars: UTF8String; Interval: integer): UTF8String;
|
|
// Insert AnsiChars in AValue at each Interval AnsiChars
|
|
var
|
|
i, j, ALength: integer;
|
|
// local
|
|
procedure InsertControlChars;
|
|
var
|
|
k: integer;
|
|
begin
|
|
for k := 1 to Length(Chars) do
|
|
begin
|
|
Result[j] := Chars[k];
|
|
inc(j);
|
|
end;
|
|
end;
|
|
// main
|
|
begin
|
|
if (Length(Chars) = 0) or (Interval <= 0) then
|
|
begin
|
|
Result := AValue;
|
|
exit;
|
|
end;
|
|
|
|
// Calculate length based on original length and total extra length for control AnsiChars
|
|
ALength := Length(AValue) + ((Length(AValue) - 1) div Interval + 3) * Length(Chars);
|
|
SetLength(Result, ALength);
|
|
|
|
// Copy and insert
|
|
j := 1;
|
|
for i := 1 to Length(AValue) do
|
|
begin
|
|
if (i mod Interval) = 1 then
|
|
// Insert control AnsiChars
|
|
InsertControlChars;
|
|
Result[j] := AValue[i];
|
|
inc(j);
|
|
end;
|
|
InsertControlChars;
|
|
|
|
// Adjust length
|
|
dec(j);
|
|
if ALength > j then
|
|
SetLength(Result, j);
|
|
end;
|
|
|
|
function sdRemoveControlChars(const AValue: UTF8String): UTF8String;
|
|
// Remove control characters from UTF8String in AValue
|
|
var
|
|
i, j: integer;
|
|
begin
|
|
Setlength(Result, Length(AValue));
|
|
i := 1;
|
|
j := 1;
|
|
while i <= Length(AValue) do
|
|
if AValue[i] in cControlChars then
|
|
inc(i)
|
|
else
|
|
begin
|
|
Result[j] := AValue[i];
|
|
inc(i);
|
|
inc(j);
|
|
end;
|
|
// Adjust length
|
|
if i <> j then
|
|
SetLength(Result, j - 1);
|
|
end;
|
|
|
|
function sdUTF8FindString(const SubString, S: UTF8String; Start, Close: integer; var APos: integer): boolean;
|
|
// Check if the Substring matches the UTF8String S in any position in interval Start to Close - 1
|
|
// and returns found positon in APos. Result = True if anything is found.
|
|
// Note: this funtion is case-insensitive
|
|
var
|
|
CharIndex: integer;
|
|
begin
|
|
Result := False;
|
|
APos := 0;
|
|
for CharIndex := Start to Close - Length(SubString) do
|
|
if sdUTF8MatchString(SubString, S, CharIndex) then
|
|
begin
|
|
APos := CharIndex;
|
|
Result := True;
|
|
exit;
|
|
end;
|
|
end;
|
|
|
|
function UTF8CompareText(const S1, S2: UTF8String): integer;
|
|
begin
|
|
Result := AnsiCompareText(string(S1), string(S2));
|
|
end;
|
|
|
|
function IntToUTF8Str(Value: integer): UTF8String;
|
|
begin
|
|
Result := UTF8String(IntToStr(Value));
|
|
end;
|
|
|
|
function Int64ToUTF8Str(Value: int64): UTF8String;
|
|
begin
|
|
Result := UTF8String(IntToStr(Value));
|
|
end;
|
|
|
|
function sdUTF8MatchString(const SubString: UTF8String; const S: UTF8String; Start: integer): boolean;
|
|
// Check if the Substring matches the string S at position Start.
|
|
// Note: this funtion is case-insensitive
|
|
var
|
|
CharIndex: integer;
|
|
begin
|
|
Result := False;
|
|
// Check range just in case
|
|
if (Length(S) - Start + 1) < Length(Substring) then
|
|
exit;
|
|
|
|
CharIndex := 0;
|
|
while CharIndex < Length(SubString) do
|
|
if sdUpCase(SubString[CharIndex + 1]) = sdUpCase(S[Start + CharIndex]) then
|
|
inc(CharIndex)
|
|
else
|
|
exit;
|
|
// All AnsiChars were the same, so we succeeded
|
|
Result := True;
|
|
end;
|
|
|
|
procedure sdUTF8ParseAttributes(const AValue: UTF8String; Start, Close: integer; Attributes: TsdUTF8StringList);
|
|
// Convert the attributes string AValue in [Start, Close - 1] to the attributes Stringlist
|
|
var
|
|
i: integer;
|
|
InQuotes: boolean;
|
|
Quote: AnsiChar;
|
|
begin
|
|
InQuotes := False;
|
|
Quote := '"';
|
|
if not assigned(Attributes) then
|
|
exit;
|
|
if not sdUTF8TrimPos(AValue, Start, Close) then
|
|
exit;
|
|
|
|
// Clear first
|
|
Attributes.Clear;
|
|
|
|
// Loop through characters
|
|
for i := Start to Close - 1 do
|
|
begin
|
|
|
|
// In quotes?
|
|
if InQuotes then
|
|
begin
|
|
if AValue[i] = Quote then
|
|
InQuotes := False;
|
|
end else
|
|
begin
|
|
if AValue[i] in cQuoteChars then
|
|
begin
|
|
InQuotes := True;
|
|
Quote := AValue[i];
|
|
end;
|
|
end;
|
|
|
|
// Add attribute strings on each controlchar break
|
|
if not InQuotes then
|
|
if AValue[i] in cControlChars then
|
|
begin
|
|
if i > Start then
|
|
Attributes.Add(copy(AValue, Start, i - Start));
|
|
Start := i + 1;
|
|
end;
|
|
end;
|
|
|
|
// Add last attribute string
|
|
if Start < Close then
|
|
Attributes.Add(copy(AValue, Start, Close - Start));
|
|
|
|
// First-char "=" signs should append to previous
|
|
for i := Attributes.Count - 1 downto 1 do
|
|
if Attributes[i][1] = '=' then
|
|
begin
|
|
Attributes[i - 1] := Attributes[i - 1] + Attributes[i];
|
|
Attributes.Delete(i);
|
|
end;
|
|
|
|
// First-char quotes should append to previous
|
|
for i := Attributes.Count - 1 downto 1 do
|
|
if (Attributes[i][1] in cQuoteChars) and (UTF8Pos('=', Attributes[i - 1]) > 0) then
|
|
begin
|
|
Attributes[i - 1] := Attributes[i - 1] + Attributes[i];
|
|
Attributes.Delete(i);
|
|
end;
|
|
end;
|
|
|
|
function sdUTF8TrimPos(const AValue: UTF8String; var Start, Close: integer): boolean;
|
|
// Trim the string in AValue in [Start, Close - 1] by adjusting Start and Close variables
|
|
begin
|
|
// Checks
|
|
Start := Max(1, Start);
|
|
Close := Min(Length(AValue) + 1, Close);
|
|
if Close <= Start then
|
|
begin
|
|
Result := False;
|
|
exit;
|
|
end;
|
|
|
|
// Trim left
|
|
while
|
|
(Start < Close) and
|
|
(AValue[Start] in cControlChars) do
|
|
inc(Start);
|
|
|
|
// Trim right
|
|
while
|
|
(Start < Close) and
|
|
(AValue[Close - 1] in cControlChars) do
|
|
dec(Close);
|
|
|
|
// Do we have a string left?
|
|
Result := Close > Start;
|
|
end;
|
|
|
|
function sdUTF8Trim(const AValue: UTF8String): UTF8String;
|
|
var
|
|
Start, Close: integer;
|
|
Res: boolean;
|
|
begin
|
|
Start := 1;
|
|
Close := length(AValue) + 1;
|
|
Res := sdUTF8TrimPos(AValue, Start, Close);
|
|
if Res then
|
|
Result := Copy(AValue, Start, Close - Start)
|
|
else
|
|
Result := '';
|
|
end;
|
|
|
|
procedure sdUTF8WriteStringToStream(S: TStream; const AString: UTF8String);
|
|
begin
|
|
if Length(AString) > 0 then
|
|
begin
|
|
{$IFDEF CLR}
|
|
S.Write(BytesOf(AString), Length(AString));
|
|
{$ELSE}
|
|
S.Write(AString[1], Length(AString));
|
|
{$ENDIF}
|
|
end;
|
|
end;
|
|
|
|
function sdUpCase(Ch: AnsiChar): AnsiChar;
|
|
begin
|
|
Result := Ch;
|
|
case Result of
|
|
'a'..'z': Dec(Result, Ord('a') - Ord('A'));
|
|
end;
|
|
end;
|
|
|
|
function ReadOpenTag(AReader: TsdSurplusReader): integer;
|
|
// Try to read the type of open tag from S
|
|
var
|
|
AIndex, i: integer;
|
|
Found: boolean;
|
|
Ch: AnsiChar;
|
|
Candidates: array[0..cTagCount - 1] of boolean;
|
|
Surplus: UTF8String;
|
|
begin
|
|
Surplus := '';
|
|
Result := cTagCount - 1;
|
|
for i := 0 to cTagCount - 1 do Candidates[i] := True;
|
|
AIndex := 1;
|
|
repeat
|
|
Found := False;
|
|
inc(AIndex);
|
|
if AReader.ReadChar(Ch) = 0 then
|
|
exit;
|
|
Surplus := Surplus + UTF8String(Ch);
|
|
for i := cTagCount - 1 downto 0 do
|
|
if Candidates[i] and (length(cTags[i].Start) >= AIndex) then
|
|
begin
|
|
if cTags[i].Start[AIndex] = Ch then
|
|
begin
|
|
Found := True;
|
|
if length(cTags[i].Start) = AIndex then
|
|
Result := i;
|
|
end else
|
|
Candidates[i] := False;
|
|
end;
|
|
until Found = False;
|
|
// The surplus string that we already read (everything after the tag)
|
|
AReader.Surplus := copy(Surplus, length(cTags[Result].Start), length(Surplus));
|
|
end;
|
|
|
|
function ReadStringFromStreamUntil(AReader: TsdSurplusReader; const ASearch: UTF8String;
|
|
var AValue: UTF8String; SkipQuotes: boolean): boolean;
|
|
var
|
|
AIndex, ValueIndex, SearchIndex: integer;
|
|
LastSearchChar, Ch: AnsiChar;
|
|
InQuotes: boolean;
|
|
QuoteChar: AnsiChar;
|
|
SB: TsdStringBuilder;
|
|
begin
|
|
Result := False;
|
|
InQuotes := False;
|
|
|
|
// Get last searchstring character
|
|
AIndex := length(ASearch);
|
|
if AIndex = 0 then exit;
|
|
LastSearchChar := ASearch[AIndex];
|
|
|
|
SB := TsdStringBuilder.Create;
|
|
try
|
|
QuoteChar := #0;
|
|
|
|
repeat
|
|
// Add characters to the value to be returned
|
|
if AReader.ReadChar(Ch) = 0 then
|
|
exit;
|
|
SB.AddChar(Ch);
|
|
|
|
// Do we skip quotes?
|
|
if SkipQuotes then
|
|
begin
|
|
if InQuotes then
|
|
begin
|
|
if (Ch = QuoteChar) then
|
|
InQuotes := false;
|
|
end else
|
|
begin
|
|
if Ch in cQuoteChars then
|
|
begin
|
|
InQuotes := true;
|
|
QuoteChar := Ch;
|
|
end;
|
|
end;
|
|
end;
|
|
|
|
// In quotes? If so, we don't check the end condition
|
|
if not InQuotes then
|
|
begin
|
|
// Is the last char the same as the last char of the search string?
|
|
if Ch = LastSearchChar then
|
|
begin
|
|
|
|
// Check to see if the whole search string is present
|
|
ValueIndex := SB.Length - 1;
|
|
SearchIndex := length(ASearch) - 1;
|
|
if ValueIndex < SearchIndex then continue;
|
|
|
|
Result := True;
|
|
while (SearchIndex > 0)and Result do
|
|
begin
|
|
Result := SB[ValueIndex] = ASearch[SearchIndex];
|
|
dec(ValueIndex);
|
|
dec(SearchIndex);
|
|
end;
|
|
end;
|
|
end;
|
|
until Result;
|
|
|
|
// Use only the part before the search string
|
|
AValue := SB.StringCopy(1, SB.Length - length(ASearch));
|
|
finally
|
|
SB.Free;
|
|
end;
|
|
end;
|
|
|
|
function ReadStringFromStreamWithQuotes(S: TStream; const Terminator: UTF8String;
|
|
var AValue: UTF8String): boolean;
|
|
var
|
|
Ch, QuoteChar: AnsiChar;
|
|
InQuotes: boolean;
|
|
SB: TsdStringBuilder;
|
|
begin
|
|
SB := TsdStringBuilder.Create;
|
|
try
|
|
QuoteChar := #0;
|
|
Result := False;
|
|
InQuotes := False;
|
|
repeat
|
|
if S.Read(Ch, 1) = 0 then exit;
|
|
if not InQuotes then
|
|
begin
|
|
if (Ch = '"') or (Ch = '''') then
|
|
begin
|
|
InQuotes := True;
|
|
QuoteChar := Ch;
|
|
end;
|
|
end else
|
|
begin
|
|
if Ch = QuoteChar then
|
|
InQuotes := False;
|
|
end;
|
|
if not InQuotes and (UTF8String(Ch) = Terminator) then
|
|
break;
|
|
SB.AddChar(Ch);
|
|
until False;
|
|
AValue := SB.Value;
|
|
Result := True;
|
|
finally
|
|
SB.Free;
|
|
end;
|
|
end;
|
|
|
|
function GetTimeZoneBias: Integer;
|
|
// uses windows unit, func GetTimeZoneInformation
|
|
var
|
|
TimeZoneInfo: TTimeZoneInformation;
|
|
begin
|
|
case GetTimeZoneInformation(TimeZoneInfo) of
|
|
TIME_ZONE_ID_UNKNOWN: Result := TimeZoneInfo.Bias;
|
|
TIME_ZONE_ID_STANDARD: Result := TimeZoneInfo.Bias + TimeZoneInfo.StandardBias;
|
|
TIME_ZONE_ID_DAYLIGHT: Result := TimeZoneInfo.Bias + TimeZoneInfo.DaylightBias;
|
|
else
|
|
Result := 0;
|
|
end;
|
|
end;
|
|
|
|
function sdDateTimeFromString(const ADate: UTF8String; UseLocalBias: Boolean): TDateTime;
|
|
// Convert the string ADate to a TDateTime according to the W3C date/time specification
|
|
// as found here: http://www.w3.org/TR/NOTE-datetime
|
|
// contributor: Stefan Glienke
|
|
var
|
|
AYear, AMonth, ADay, AHour, AMin, ASec, AMSec: word;
|
|
ALocalBias, ABias: Integer;
|
|
begin
|
|
AYear := StrToInt(string(copy(ADate, 1, 4)));
|
|
AMonth := StrToInt(string(copy(ADate, 6, 2)));
|
|
ADay := StrToInt(string(copy(ADate, 9, 2)));
|
|
if Length(ADate) > 16 then
|
|
begin
|
|
AHour := StrToInt(string(copy(ADate, 12, 2)));
|
|
AMin := StrToInt(string(copy(ADate, 15, 2)));
|
|
ASec := StrToIntDef(string(copy(ADate, 18, 2)), 0); // They might be omitted, so default to 0
|
|
AMSec := StrToIntDef(string(copy(ADate, 21, 3)), 0); // They might be omitted, so default to 0
|
|
end else
|
|
begin
|
|
AHour := 0;
|
|
AMin := 0;
|
|
ASec := 0;
|
|
AMSec := 0;
|
|
end;
|
|
Result :=
|
|
EncodeDate(AYear, AMonth, ADay) +
|
|
EncodeTime(AHour, AMin, ASec, AMSec);
|
|
ALocalBias := GetTimeZoneBias;
|
|
if UseLocalBias then
|
|
begin
|
|
if (Length(ADate) > 24) then
|
|
begin
|
|
ABias := StrToInt(string(Copy(ADate, 25, 2))) * MinsPerHour +
|
|
StrToInt(string(Copy(ADate, 28, 2)));
|
|
if ADate[24] = '+' then
|
|
ABias := ABias * -1;
|
|
Result := Result + ABias / MinsPerDay;
|
|
end;
|
|
Result := Result - ALocalBias / MinsPerDay;
|
|
end;
|
|
end;
|
|
|
|
function sdDateTimeFromStringDefault(const ADate: UTF8String; ADefault: TDateTime; UseLocalBias: Boolean): TDateTime;
|
|
// Convert the string ADate to a TDateTime according to the W3C date/time specification
|
|
// as found here: http://www.w3.org/TR/NOTE-datetime
|
|
// If there is a conversion error, the default value ADefault is returned.
|
|
begin
|
|
try
|
|
Result := sdDateTimeFromString(ADate, UseLocalBias);
|
|
except
|
|
Result := ADefault;
|
|
end;
|
|
end;
|
|
|
|
function sdDateTimeToString(ADate: TDateTime; UseLocalBias: Boolean): UTF8String;
|
|
// Convert the TDateTime ADate to a string according to the W3C date/time specification
|
|
// as found here: http://www.w3.org/TR/NOTE-datetime
|
|
// contributor: Stefan Glienke
|
|
var
|
|
AYear, AMonth, ADay, AHour, AMin, ASec, AMSec: word;
|
|
ABias: Integer;
|
|
const
|
|
Neg: array[Boolean] of string = ('+', '-');
|
|
begin
|
|
DecodeDate(ADate, AYear, AMonth, ADay);
|
|
DecodeTime(ADate, AHour, AMin, ASec, AMSec);
|
|
if frac(ADate) = 0 then
|
|
Result := UTF8String(Format('%.4d-%.2d-%.2d', [AYear, AMonth, ADay]))
|
|
else
|
|
begin
|
|
ABias := GetTimeZoneBias;
|
|
if UseLocalBias and (ABias <> 0) then
|
|
Result := UTF8String(Format('%.4d-%.2d-%.2dT%.2d:%.2d:%.2d.%.3d%s%.2d:%.2d',
|
|
[AYear, AMonth, ADay, AHour, AMin, ASec, AMSec,
|
|
Neg[ABias > 0], Abs(ABias) div MinsPerHour, Abs(ABias) mod MinsPerHour]))
|
|
else
|
|
Result := UTF8String(Format('%.4d-%.2d-%.2dT%.2d:%.2d:%.2d.%.3dZ',
|
|
[AYear, AMonth, ADay, AHour, AMin, ASec, AMSec]));
|
|
end;
|
|
end;
|
|
|
|
function sdWriteNumber(Value: double; SignificantDigits: integer; AllowScientific: boolean): UTF8String;
|
|
const
|
|
Limits: array[1..9] of integer =
|
|
(10, 100, 1000, 10000, 100000, 1000000, 10000000, 100000000, 1000000000);
|
|
var
|
|
Limit, Limitd, PointPos, IntVal, ScPower: integer;
|
|
Body: UTF8String;
|
|
begin
|
|
if (SignificantDigits < 1) or (SignificantDigits > 9) then
|
|
raise Exception.Create(sxeSignificantDigitsOutOfRange);
|
|
|
|
// Zero
|
|
if Value = 0 then
|
|
begin
|
|
Result := '0';
|
|
exit;
|
|
end;
|
|
|
|
// Sign
|
|
if Value < 0 then
|
|
begin
|
|
Result := '-';
|
|
Value := -Value;
|
|
end else
|
|
Result := '';
|
|
|
|
// Determine point position
|
|
Limit := Limits[SignificantDigits];
|
|
Limitd := Limit div 10;
|
|
PointPos := SignificantDigits;
|
|
while Value < Limitd do
|
|
begin
|
|
Value := Value * 10;
|
|
dec(PointPos);
|
|
end;
|
|
while Value >= Limit do
|
|
begin
|
|
Value := Value * 0.1;
|
|
inc(PointPos);
|
|
end;
|
|
|
|
// Round
|
|
IntVal := round(Value);
|
|
|
|
// Exceptional case which happens when the value rounds up to the limit
|
|
if Intval = Limit then
|
|
begin
|
|
IntVal := IntVal div 10;
|
|
inc(PointPos);
|
|
end;
|
|
|
|
// Strip off any zeros, these reduce significance count
|
|
while (IntVal mod 10 = 0) and (PointPos < SignificantDigits) do
|
|
begin
|
|
dec(SignificantDigits);
|
|
IntVal := IntVal div 10;
|
|
end;
|
|
|
|
// Check for scientific notation
|
|
ScPower := 0;
|
|
if AllowScientific and ((PointPos < -1) or (PointPos > SignificantDigits + 2)) then
|
|
begin
|
|
ScPower := PointPos - 1;
|
|
dec(PointPos, ScPower);
|
|
end;
|
|
|
|
// Body
|
|
Body := IntToUTF8Str(IntVal);
|
|
while PointPos > SignificantDigits do
|
|
begin
|
|
Body := Body + '0';
|
|
inc(SignificantDigits);
|
|
end;
|
|
while PointPos < 0 do
|
|
begin
|
|
Body := '0' + Body;
|
|
inc(PointPos);
|
|
end;
|
|
if PointPos = 0 then
|
|
Body := '.' + Body
|
|
else
|
|
if PointPos < SignificantDigits then
|
|
Body := copy(Body, 1, PointPos) + '.' + copy(Body, PointPos + 1, SignificantDigits);
|
|
|
|
// Final result
|
|
if ScPower = 0 then
|
|
Result := Result + Body
|
|
else
|
|
Result := Result + Body + 'E' + IntToUTF8Str(ScPower);
|
|
end;
|
|
|
|
{$IFDEF CLR}
|
|
|
|
function sdUnicodeToUtf8(const W: UnicodeString): UTF8String;
|
|
begin
|
|
Result := Encoding.UTF8.GetBytes(W);
|
|
end;
|
|
|
|
function sdUtf8ToUnicode(const S: UTF8String): UnicodeString;
|
|
begin
|
|
Result := Encoding.UTF8.GetString(BytesOf(S));
|
|
end;
|
|
|
|
function EncodeBase64Buf(const Buffer: TBytes; Count: Integer): UTF8String;
|
|
begin
|
|
Result := Convert.ToBase64String(Buffer, 0, Count);
|
|
end;
|
|
|
|
function EncodeBase64(const Source: UTF8String): UTF8String;
|
|
begin
|
|
Result := Convert.ToBase64String(BytesOf(Source));
|
|
end;
|
|
|
|
procedure DecodeBase64Buf(const Source: UTF8String; var Buffer: TBytes; Count: Integer);
|
|
var
|
|
ADecoded: TBytes;
|
|
begin
|
|
ADecoded := Convert.FromBase64String(Source);
|
|
if Count > Length(ADecoded) then
|
|
raise EFilerError.Create(sxeMissingDataInBinaryStream);
|
|
SetLength(ADecoded, Count);
|
|
Buffer := ADecoded;
|
|
end;
|
|
|
|
function DecodeBase64(const Source: UTF8String): UTF8String;
|
|
begin
|
|
Result := UTF8String(Convert.FromBase64String(Source));
|
|
end;
|
|
|
|
{$ELSE}
|
|
|
|
function PtrUnicodeToUtf8(Dest: PAnsiChar; MaxDestBytes: Cardinal; Source: PUnicodeChar; SourceChars: Cardinal): Cardinal;
|
|
var
|
|
i, count: Cardinal;
|
|
c: Cardinal;
|
|
begin
|
|
Result := 0;
|
|
if not assigned(Source) or not assigned(Dest) then
|
|
exit;
|
|
|
|
count := 0;
|
|
i := 0;
|
|
|
|
while (i < SourceChars) and (count < MaxDestBytes) do
|
|
begin
|
|
c := Cardinal(Source[i]);
|
|
Inc(i);
|
|
if c <= $7F then
|
|
begin
|
|
Dest[count] := AnsiChar(c);
|
|
Inc(count);
|
|
end else
|
|
if c > $7FF then
|
|
begin
|
|
if count + 3 > MaxDestBytes then
|
|
break;
|
|
Dest[count] := AnsiChar($E0 or (c shr 12));
|
|
Dest[count+1] := AnsiChar($80 or ((c shr 6) and $3F));
|
|
Dest[count+2] := AnsiChar($80 or (c and $3F));
|
|
Inc(count,3);
|
|
end else
|
|
begin // $7F < Source[i] <= $7FF
|
|
if count + 2 > MaxDestBytes then
|
|
break;
|
|
Dest[count] := AnsiChar($C0 or (c shr 6));
|
|
Dest[count+1] := AnsiChar($80 or (c and $3F));
|
|
Inc(count,2);
|
|
end;
|
|
end;
|
|
if count >= MaxDestBytes then
|
|
count := MaxDestBytes-1;
|
|
Dest[count] := #0;
|
|
Result := count + 1; // convert zero based index to byte count
|
|
end;
|
|
|
|
function PtrUtf8ToUnicode(Dest: PUnicodeChar; MaxDestChars: Cardinal; Source: PAnsiChar;
|
|
SourceBytes: Cardinal): Cardinal;
|
|
var
|
|
i, count: Cardinal;
|
|
c: Byte;
|
|
wc: Cardinal;
|
|
begin
|
|
if not assigned(Dest) or not assigned(Source) then
|
|
begin
|
|
Result := 0;
|
|
Exit;
|
|
end;
|
|
Result := Cardinal(-1);
|
|
count := 0;
|
|
i := 0;
|
|
while (i < SourceBytes) and (count < MaxDestChars) do
|
|
begin
|
|
wc := Cardinal(Source[i]);
|
|
Inc(i);
|
|
if (wc and $80) <> 0 then
|
|
begin
|
|
if i >= SourceBytes then
|
|
// incomplete multibyte char
|
|
Exit;
|
|
wc := wc and $3F;
|
|
if (wc and $20) <> 0 then
|
|
begin
|
|
c := Byte(Source[i]);
|
|
Inc(i);
|
|
if (c and $C0) <> $80 then
|
|
// malformed trail byte or out of range char
|
|
Exit;
|
|
if i >= SourceBytes then
|
|
// incomplete multibyte char
|
|
Exit;
|
|
wc := (wc shl 6) or (c and $3F);
|
|
end;
|
|
c := Byte(Source[i]);
|
|
Inc(i);
|
|
if (c and $C0) <> $80 then
|
|
// malformed trail byte
|
|
Exit;
|
|
Dest[count] := UnicodeChar((wc shl 6) or (c and $3F));
|
|
end else
|
|
Dest[count] := UnicodeChar(wc);
|
|
Inc(count);
|
|
end;
|
|
|
|
if count >= MaxDestChars then
|
|
count := MaxDestChars-1;
|
|
|
|
Dest[count] := #0;
|
|
Result := count + 1;
|
|
end;
|
|
|
|
function sdUnicodeToUtf8(const W: UnicodeString): UTF8String;
|
|
var
|
|
L: integer;
|
|
Temp: UTF8String;
|
|
begin
|
|
Result := '';
|
|
if W = '' then
|
|
Exit;
|
|
SetLength(Temp, Length(W) * 3); // SetLength includes space for null terminator
|
|
|
|
L := PtrUnicodeToUtf8(PAnsiChar(Temp), Length(Temp) + 1, PUnicodeChar(W), Length(W));
|
|
if L > 0 then
|
|
SetLength(Temp, L - 1)
|
|
else
|
|
Temp := '';
|
|
Result := Temp;
|
|
end;
|
|
|
|
function sdUtf8ToUnicode(const S: UTF8String): UnicodeString;
|
|
var
|
|
L: Integer;
|
|
Temp: UnicodeString;
|
|
begin
|
|
Result := '';
|
|
if S = '' then
|
|
Exit;
|
|
SetLength(Temp, Length(S));
|
|
|
|
L := PtrUtf8ToUnicode(PUnicodeChar(Temp), Length(Temp)+1, PAnsiChar(S), Length(S));
|
|
if L > 0 then
|
|
SetLength(Temp, L-1)
|
|
else
|
|
Temp := '';
|
|
Result := Temp;
|
|
end;
|
|
|
|
function EncodeBase64Buf(const Buffer; Count: Integer): UTF8String;
|
|
var
|
|
i, j: integer;
|
|
ACore: integer;
|
|
ALong: cardinal;
|
|
S: PByte;
|
|
begin
|
|
// Make sure ASize is always a multiple of 3, and this multiple
|
|
// gets saved as 4 characters
|
|
ACore := (Count + 2) div 3;
|
|
|
|
// Set the length of the string that stores encoded characters
|
|
SetLength(Result, ACore * 4);
|
|
S := @Buffer;
|
|
// Do the loop ACore times
|
|
for i := 0 to ACore - 1 do
|
|
begin
|
|
ALong := 0;
|
|
for j := 0 to 2 do
|
|
begin
|
|
ALong := ALong shl 8 + S^;
|
|
inc(S);
|
|
end;
|
|
for j := 0 to 3 do
|
|
begin
|
|
Result[i * 4 + 4 - j] := cBase64Char[ALong and $3F];
|
|
ALong := ALong shr 6;
|
|
end;
|
|
end;
|
|
// For comformity to Base64, we must pad the data instead of zero out
|
|
// if the size is not an exact multiple of 3
|
|
case ACore * 3 - Count of
|
|
0:;// nothing to do
|
|
1: // pad one byte
|
|
Result[ACore * 4] := cBase64PadChar;
|
|
2: // pad two bytes
|
|
begin
|
|
Result[ACore * 4 ] := cBase64PadChar;
|
|
Result[ACore * 4 - 1] := cBase64PadChar;
|
|
end;
|
|
end;//case
|
|
end;
|
|
|
|
function EncodeBase64(const Source: RawByteString): UTF8String;
|
|
// Encode binary data in Source as BASE64. The function returns the BASE64 encoded
|
|
// data as string, without any linebreaks.
|
|
begin
|
|
if length(Source) > 0 then
|
|
Result := EncodeBase64Buf(Source[1], length(Source))
|
|
else
|
|
Result := '';
|
|
end;
|
|
|
|
procedure DecodeBase64Buf(var Source: UTF8String; var Buffer; Count: Integer);
|
|
var
|
|
i, j: integer;
|
|
BufPos, Core: integer;
|
|
LongVal: cardinal;
|
|
D: PByte;
|
|
Map: array[AnsiChar] of byte;
|
|
begin
|
|
// Core * 4 is the number of chars to read - check length
|
|
Core := Length(Source) div 4;
|
|
if Count > Core * 3 then
|
|
raise EFilerError.Create(sxeMissingDataInBinaryStream);
|
|
|
|
// Prepare map
|
|
for i := 0 to 63 do
|
|
Map[cBase64Char[i]] := i;
|
|
D := @Buffer;
|
|
|
|
// Check for final padding, and replace with "zeros". There can be
|
|
// at max two pad chars ('=')
|
|
BufPos := length(Source);
|
|
if (BufPos > 0) and (Source[BufPos] = cBase64PadChar) then
|
|
begin
|
|
Source[BufPos] := cBase64Char[0];
|
|
dec(BufPos);
|
|
if (BufPos > 0) and (Source[BufPos] = cBase64PadChar) then
|
|
Source[BufPos] := cBase64Char[0];
|
|
end;
|
|
|
|
// Do this Core times
|
|
for i := 0 to Core - 1 do
|
|
begin
|
|
LongVal := 0;
|
|
// Unroll the characters
|
|
for j := 0 to 3 do
|
|
LongVal := LongVal shl 6 + Map[Source[i * 4 + j + 1]];
|
|
// and unroll the bytes
|
|
for j := 2 downto 0 do
|
|
begin
|
|
// Check overshoot
|
|
if integer(D) - integer(@Buffer) >= Count then
|
|
exit;
|
|
D^ := LongVal shr (j * 8) and $FF;
|
|
inc(D);
|
|
end;
|
|
end;
|
|
end;
|
|
|
|
function DecodeBase64(const Source: UTF8String): RawByteString;
|
|
// Decode BASE64 data in Source into binary data. The function returns the binary
|
|
// data as UTF8String. Use a TStringStream to convert this data to a stream.
|
|
var
|
|
BufData: UTF8String;
|
|
BufSize, BufPos: integer;
|
|
begin
|
|
BufData := sdRemoveControlChars(Source);
|
|
|
|
// Determine length of data
|
|
BufSize := length(BufData) div 4;
|
|
if BufSize * 4 <> length(BufData) then
|
|
raise EFilerError.Create(sxeErrorCalcStreamLength);
|
|
BufSize := BufSize * 3;
|
|
// Check padding AnsiChars
|
|
BufPos := length(BufData);
|
|
if (BufPos > 0) and (BufData[BufPos] = cBase64PadChar) then
|
|
begin
|
|
dec(BufPos);
|
|
dec(BufSize);
|
|
if (BufPos > 0) and (BufData[BufPos] = cBase64PadChar) then
|
|
dec(BufSize);
|
|
end;
|
|
Setlength(Result, BufSize);
|
|
|
|
// Decode
|
|
if BufSize > 0 then
|
|
DecodeBase64Buf(BufData, Result[1], BufSize);
|
|
end;
|
|
|
|
{$ENDIF}
|
|
|
|
function sdAnsiToUtf8(const S: AnsiString): UTF8String;
|
|
begin
|
|
// We let the OS figure out Ansi<->Unicode
|
|
Result := sdUnicodeToUtf8(UnicodeString(S));
|
|
end;
|
|
|
|
function sdUtf8ToAnsi(const S: UTF8String): AnsiString;
|
|
begin
|
|
// We let the OS figure out Ansi<->Unicode. There might be dataloss!
|
|
Result := Ansistring(sdUtf8ToUnicode(S));
|
|
end;
|
|
|
|
function EncodeBinHexBuf(const Source; Count: Integer): UTF8String;
|
|
// Encode binary data in Source as BINHEX. The function returns the BINHEX encoded
|
|
// data as UTF8String, without any linebreaks.
|
|
var
|
|
{$IFDEF CLR}
|
|
Text: TBytes;
|
|
{$ELSE}
|
|
Text: UTF8String;
|
|
{$ENDIF}
|
|
begin
|
|
SetLength(Text, Count * 2);
|
|
{$IFDEF CLR}
|
|
BinToHex(TBytes(Source), 0, Text, 0, Count);
|
|
{$ELSE}
|
|
BinToHex(PAnsiChar(@Source), PAnsiChar(Text), Count);
|
|
{$ENDIF}
|
|
Result := Text;
|
|
end;
|
|
|
|
function EncodeBinHex(const Source: RawByteString): UTF8String;
|
|
// Encode binary data in Source as BINHEX. The function returns the BINHEX encoded
|
|
// data as UTF8String, without any linebreaks.
|
|
var
|
|
{$IFDEF CLR}
|
|
Text: TBytes;
|
|
{$ELSE}
|
|
Text: UTF8String;
|
|
{$ENDIF}
|
|
begin
|
|
SetLength(Text, Length(Source) * 2);
|
|
{$IFDEF CLR}
|
|
BinToHex(BytesOf(Source), 0, Text, 0, Length(Source));
|
|
{$ELSE}
|
|
BinToHex(PAnsiChar(Source), PAnsiChar(Text), Length(Source));
|
|
{$ENDIF}
|
|
Result := Text;
|
|
end;
|
|
|
|
procedure DecodeBinHexBuf(const Source: UTF8String; var Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Count: Integer);
|
|
// Decode BINHEX data in Source into binary data.
|
|
begin
|
|
if Length(Source) div 2 < Count then
|
|
raise EFilerError.Create(sxeMissingDataInBinaryStream);
|
|
|
|
{$IFDEF CLR}
|
|
HexToBin(BytesOf(Source), 0, Buffer, 0, Count);
|
|
{$ELSE}
|
|
HexToBin(PAnsiChar(Source), PAnsiChar(@Buffer), Count);
|
|
{$ENDIF}
|
|
end;
|
|
|
|
function DecodeBinHex(const Source: UTF8String): RawByteString;
|
|
// Decode BINHEX data in Source into binary data. The function returns the binary
|
|
// data as RawByteString. Use a TStringStream to convert this data to a stream.
|
|
var
|
|
Data: Utf8String;
|
|
Size: integer;
|
|
{$IFDEF CLR}
|
|
Buffer: TBytes;
|
|
{$ELSE}
|
|
Buffer: RawByteString;
|
|
{$ENDIF}
|
|
begin
|
|
Data := sdRemoveControlChars(Source);
|
|
|
|
// Determine length of data
|
|
Size := length(Data) div 2;
|
|
if Size * 2 <> length(Data) then
|
|
raise EFilerError.Create(sxeErrorCalcStreamLength);
|
|
|
|
SetLength(Buffer, Size);
|
|
{$IFDEF CLR}
|
|
HexToBin(BytesOf(Data), 0, Buffer, 0, Size);
|
|
{$ELSE}
|
|
HexToBin(PAnsiChar(Data), PAnsiChar(Buffer), Size);
|
|
{$ENDIF}
|
|
Result := Buffer;
|
|
end;
|
|
|
|
function sdStringToBool(const AValue: UTF8String): boolean;
|
|
var
|
|
Ch: AnsiChar;
|
|
begin
|
|
if Length(AValue) > 0 then
|
|
begin
|
|
Ch := sdUpCase(AValue[1]);
|
|
if Ch in ['T', 'Y', '1'] then
|
|
begin
|
|
Result := True;
|
|
exit;
|
|
end;
|
|
if Ch in ['F', 'N', '0'] then
|
|
begin
|
|
Result := False;
|
|
exit;
|
|
end;
|
|
end;
|
|
raise Exception.Create(sxeCannotConverToBool);
|
|
end;
|
|
|
|
function sdStringFromBool(ABool: boolean): UTF8String;
|
|
const
|
|
cBoolValues: array[boolean] of UTF8String = ('false', 'true');
|
|
begin
|
|
Result := cBoolValues[ABool];
|
|
end;
|
|
|
|
{ TsdUTF8StringList }
|
|
|
|
function TsdUTF8StringList.Add(const S: UTF8String): integer;
|
|
var
|
|
L: integer;
|
|
begin
|
|
L := Length(FItems);
|
|
if L = FCount then
|
|
begin
|
|
// Increase capacity
|
|
SetLength(FItems, FCount + 4);
|
|
end;
|
|
FItems[FCount] := S;
|
|
Result := FCount;
|
|
inc(FCount);
|
|
end;
|
|
|
|
procedure TsdUTF8StringList.Assign(Source: TPersistent);
|
|
var
|
|
i: integer;
|
|
SL: TsdUTF8StringList;
|
|
begin
|
|
if Source is TsdUTF8StringList then
|
|
begin
|
|
SL := TsdUTF8StringList(Source);
|
|
SetLength(FItems, SL.FCount);
|
|
for i := 0 to SL.FCount - 1 do
|
|
FItems[i] := SL.FItems[i];
|
|
FCount := SL.FCount;
|
|
end else
|
|
inherited;
|
|
end;
|
|
|
|
procedure TsdUTF8StringList.Clear;
|
|
begin
|
|
FCount := 0;
|
|
end;
|
|
|
|
procedure TsdUTF8StringList.Delete(Index: Integer);
|
|
var
|
|
i: integer;
|
|
begin
|
|
if (Index < 0) or (Index >= Count) then
|
|
exit;
|
|
for i := Index + 1 to Count - 1 do
|
|
FItems[i - 1] := FItems[i];
|
|
dec(FCount);
|
|
end;
|
|
|
|
function TsdUTF8StringList.GetItems(Index: integer): UTF8String;
|
|
begin
|
|
if (Index >= 0) and (Index < Count) then
|
|
Result := FItems[Index]
|
|
else
|
|
Result := '';
|
|
end;
|
|
|
|
function TsdUTF8StringList.GetNames(Index: integer): UTF8String;
|
|
var
|
|
P: integer;
|
|
begin
|
|
Result := Items[Index];
|
|
P := UTF8Pos('=', Result);
|
|
if P <> 0 then
|
|
SetLength(Result, P - 1)
|
|
else
|
|
SetLength(Result, 0);
|
|
end;
|
|
|
|
function TsdUTF8StringList.GetText: UTF8String;
|
|
const
|
|
cLB: UTF8String = #13#10;
|
|
var
|
|
i, L, LItem: integer;
|
|
P: PAnsiChar;
|
|
begin
|
|
L := 0;
|
|
for i := 0 to Count - 1 do
|
|
begin
|
|
inc(L, length(FItems[i]));
|
|
inc(L, 2);
|
|
end;
|
|
SetLength(Result, L);
|
|
if L = 0 then
|
|
exit;
|
|
P := @Result[1];
|
|
for i := 0 to Count - 1 do
|
|
begin
|
|
LItem := length(FItems[i]);
|
|
if LItem > 0 then
|
|
begin
|
|
System.Move(FItems[i][1], P^, LItem);
|
|
inc(P, LItem);
|
|
end;
|
|
System.Move(cLB[1], P^, 2);
|
|
inc(P, 2);
|
|
end;
|
|
end;
|
|
|
|
function TsdUTF8StringList.GetValues(const Name: UTF8String): UTF8String;
|
|
var
|
|
Idx: integer;
|
|
begin
|
|
Idx := IndexOfName(Name);
|
|
if Idx >= 0 then
|
|
Result := Copy(FItems[Idx], Length(Name) + 2, MaxInt)
|
|
else
|
|
Result := '';
|
|
end;
|
|
|
|
function TsdUTF8StringList.IndexOfName(const Name: UTF8String): integer;
|
|
begin
|
|
for Result := 0 to Count - 1 do
|
|
begin
|
|
if sdUTF8MatchString(Name + '=', FItems[Result], 1) then
|
|
exit;
|
|
end;
|
|
Result := -1;
|
|
end;
|
|
|
|
procedure TsdUTF8StringList.SetItems(Index: integer; const Value: UTF8String);
|
|
begin
|
|
if (Index >= 0) and (Index < Count) then
|
|
FItems[Index] := Value;
|
|
end;
|
|
|
|
procedure TsdUTF8StringList.SetValues(const Name, Value: UTF8String);
|
|
var
|
|
Idx: integer;
|
|
begin
|
|
Idx := IndexOfName(Name);
|
|
if Value <> '' then
|
|
begin
|
|
if Idx < 0 then
|
|
Idx := Add('');
|
|
FItems[Idx] := Name + '=' + Value;
|
|
end else
|
|
Delete(Idx);
|
|
end;
|
|
|
|
{ TXmlNode }
|
|
|
|
function TXmlNode.AbortParsing: boolean;
|
|
begin
|
|
Result := assigned(Document) and Document.AbortParsing;
|
|
end;
|
|
|
|
procedure TXmlNode.Assign(Source: TPersistent);
|
|
var
|
|
i: integer;
|
|
Node: TXmlNode;
|
|
begin
|
|
if Source is TXmlNode then
|
|
begin
|
|
// Clear first
|
|
Clear;
|
|
|
|
// Properties
|
|
FElementType := TXmlNode(Source).FElementType;
|
|
FName := TXmlNode(Source).FName;
|
|
FTag := TXmlNode(Source).FTag;
|
|
FValue := TXmlNode(Source).FValue;
|
|
|
|
// Attributes
|
|
if assigned(TXmlNode(Source).FAttributes) then
|
|
begin
|
|
CheckCreateAttributesList;
|
|
FAttributes.Assign(TXmlNode(Source).FAttributes);
|
|
end;
|
|
|
|
// Nodes
|
|
for i := 0 to TXmlNode(Source).NodeCount - 1 do
|
|
begin
|
|
Node := NodeNew('');
|
|
Node.Assign(TXmlNode(Source).Nodes[i]);
|
|
end;
|
|
end else
|
|
if Source is TNativeXml then
|
|
begin
|
|
Assign(TNativeXml(Source).FRootNodes);
|
|
end else
|
|
inherited;
|
|
end;
|
|
|
|
procedure TXmlNode.AttributeAdd(const AName, AValue: UTF8String);
|
|
var
|
|
Attr: UTF8String;
|
|
begin
|
|
Attr := UTF8String(Format('%s=%s', [AName, sdUTF8QuotedString(sdUTF8EscapeString(AValue))]));
|
|
CheckCreateAttributesList;
|
|
FAttributes.Add(Attr);
|
|
end;
|
|
|
|
procedure TXmlNode.AttributeAdd(const AName: UTF8String; AValue: integer);
|
|
begin
|
|
AttributeAdd(AName, IntToUTF8Str(AValue));
|
|
end;
|
|
|
|
procedure TXmlNode.AttributeDelete(Index: integer);
|
|
begin
|
|
if (Index >= 0) and (Index < AttributeCount) then
|
|
FAttributes.Delete(Index);
|
|
end;
|
|
|
|
procedure TXmlNode.AttributeExchange(Index1, Index2: integer);
|
|
var
|
|
Temp: UTF8String;
|
|
begin
|
|
if (Index1 <> Index2) and
|
|
(Index1 >= 0) and (Index1 < FAttributes.Count) and
|
|
(Index2 >= 0) and (Index2 < FAttributes.Count) then
|
|
begin
|
|
Temp := FAttributes[Index1];
|
|
FAttributes[Index1] := FAttributes[Index2];
|
|
FAttributes[Index2] := Temp;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.AttributeIndexByname(const AName: UTF8String): integer;
|
|
// Return the index of the attribute with name AName, or -1 if not found
|
|
begin
|
|
if assigned(FAttributes) then
|
|
Result := FAttributes.IndexOfName(AName)
|
|
else
|
|
Result := -1;
|
|
end;
|
|
|
|
procedure TXmlNode.AttributesClear;
|
|
begin
|
|
FreeAndNil(FAttributes);
|
|
end;
|
|
|
|
function TXmlNode.BufferLength: integer;
|
|
var
|
|
BufData: UTF8String;
|
|
BufPos: integer;
|
|
begin
|
|
BufData := sdRemoveControlChars(FValue);
|
|
case BinaryEncoding of
|
|
xbeBinHex:
|
|
begin
|
|
Result := length(BufData) div 2;
|
|
if Result * 2 <> length(BufData) then
|
|
raise EFilerError.Create(sxeErrorCalcStreamLength);
|
|
end;
|
|
xbeBase64:
|
|
begin
|
|
Result := length(BufData) div 4;
|
|
if Result * 4 <> length(BufData) then
|
|
raise EFilerError.Create(sxeErrorCalcStreamLength);
|
|
Result := Result * 3;
|
|
// Check padding AnsiChars
|
|
BufPos := length(BufData);
|
|
if (BufPos > 0) and (BufData[BufPos] = cBase64PadChar) then
|
|
begin
|
|
dec(BufPos);
|
|
dec(Result);
|
|
if (BufPos > 0) and (BufData[BufPos] = cBase64PadChar) then
|
|
dec(Result);
|
|
end;
|
|
end;
|
|
else
|
|
Result := 0; // avoid compiler warning
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.BufferRead(var Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Count: Integer);
|
|
// Read data from XML binhex to the buffer
|
|
var
|
|
BufData: UTF8String;
|
|
begin
|
|
BufData := sdRemoveControlChars(FValue);
|
|
case BinaryEncoding of
|
|
xbeBinHex:
|
|
DecodeBinHexBuf(BufData, Buffer, Count);
|
|
xbeBase64:
|
|
DecodeBase64Buf(BufData, Buffer, Count);
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.BufferWrite(const Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Count: Integer);
|
|
// Write data from the buffer to XML in binhex or base64 format
|
|
var
|
|
BufData: UTF8String;
|
|
begin
|
|
if Count > 0 then
|
|
case BinaryEncoding of
|
|
xbeBinHex:
|
|
BufData := EncodeBinHexBuf(Buffer, Count);
|
|
xbeBase64:
|
|
BufData := EncodeBase64Buf(Buffer, Count);
|
|
end;
|
|
|
|
// For comformity with Base64, we must add linebreaks each 76 AnsiCharacters
|
|
FValue := sdAddControlChars(BufData, GetLineFeed + GetIndent, 76);
|
|
end;
|
|
|
|
procedure TXmlNode.ChangeDocument(ADocument: TNativeXml);
|
|
var
|
|
i: integer;
|
|
begin
|
|
FDocument := ADocument;
|
|
for i := 0 to NodeCount - 1 do
|
|
Nodes[i].ChangeDocument(ADocument);
|
|
end;
|
|
|
|
procedure TXmlNode.CheckCreateAttributesList;
|
|
begin
|
|
if not assigned(FAttributes) then
|
|
FAttributes := TsdUTF8StringList.Create;
|
|
end;
|
|
|
|
procedure TXmlNode.Clear;
|
|
begin
|
|
// Name + value
|
|
FName := '';
|
|
FValue := '';
|
|
// Clear attributes and nodes
|
|
AttributesClear;
|
|
NodesClear;
|
|
end;
|
|
|
|
function TXmlNode.CompareNodeName(const NodeName: UTF8String): integer;
|
|
begin
|
|
// Compare with FullPath or local name based on NodeName's first AnsiCharacter
|
|
if length(NodeName) > 0 then
|
|
if NodeName[1] = '/' then
|
|
begin
|
|
// FullPath
|
|
Result := UTF8CompareText(FullPath, NodeName);
|
|
exit;
|
|
end;
|
|
// local name
|
|
Result := UTF8CompareText(Name, NodeName);
|
|
end;
|
|
|
|
constructor TXmlNode.Create(ADocument: TNativeXml);
|
|
begin
|
|
inherited Create;
|
|
FDocument := ADocument;
|
|
end;
|
|
|
|
constructor TXmlNode.CreateName(ADocument: TNativeXml; const AName: UTF8String);
|
|
begin
|
|
Create(ADocument);
|
|
Name := AName;
|
|
end;
|
|
|
|
constructor TXmlNode.CreateNameValue(ADocument: TNativeXml; const AName, AValue: UTF8String);
|
|
begin
|
|
Create(ADocument);
|
|
Name := AName;
|
|
ValueAsString := AValue;
|
|
end;
|
|
|
|
constructor TXmlNode.CreateType(ADocument: TNativeXml;
|
|
AType: TXmlElementType);
|
|
begin
|
|
Create(ADocument);
|
|
FElementType := AType;
|
|
end;
|
|
|
|
procedure TXmlNode.Delete;
|
|
begin
|
|
if assigned(Parent) then
|
|
Parent.NodeRemove(Self);
|
|
end;
|
|
|
|
procedure TXmlNode.DeleteEmptyAttributes;
|
|
var
|
|
i: integer;
|
|
V: UTF8String;
|
|
begin
|
|
for i := AttributeCount - 1 downto 0 do
|
|
begin
|
|
V := AttributeValue[i];
|
|
if length(V) = 0 then
|
|
FAttributes.Delete(i);
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.DeleteEmptyNodes;
|
|
var
|
|
i: integer;
|
|
Node: TXmlNode;
|
|
begin
|
|
for i := NodeCount - 1 downto 0 do
|
|
begin
|
|
Node := Nodes[i];
|
|
// Recursive call
|
|
Node.DeleteEmptyNodes;
|
|
// Check if we should delete child node
|
|
if Node.IsEmpty then
|
|
NodeDelete(i);
|
|
end;
|
|
end;
|
|
|
|
destructor TXmlNode.Destroy;
|
|
begin
|
|
NodesClear;
|
|
AttributesClear;
|
|
inherited;
|
|
end;
|
|
|
|
function TXmlNode.FindNode(const NodeName: UTF8String): TXmlNode;
|
|
// Find the first node which has name NodeName. Contrary to the NodeByName
|
|
// function, this function will search the whole subnode tree, using the
|
|
// DepthFirst method.
|
|
var
|
|
i: integer;
|
|
begin
|
|
Result := nil;
|
|
// Loop through all subnodes
|
|
for i := 0 to NodeCount - 1 do
|
|
begin
|
|
Result := Nodes[i];
|
|
// If the subnode has name NodeName then we have a result, exit
|
|
if Result.CompareNodeName(NodeName) = 0 then
|
|
exit;
|
|
// If not, we will search the subtree of this node
|
|
Result := Result.FindNode(NodeName);
|
|
if assigned(Result) then
|
|
exit;
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.FindNodes(const NodeName: UTF8String; const AList: TList);
|
|
// local
|
|
procedure FindNodesRecursive(ANode: TXmlNode; AList: TList);
|
|
var
|
|
i: integer;
|
|
begin
|
|
with ANode do
|
|
for i := 0 to NodeCount - 1 do
|
|
begin
|
|
if Nodes[i].CompareNodeName(NodeName) = 0 then
|
|
AList.Add(Nodes[i]);
|
|
FindNodesRecursive(Nodes[i], AList);
|
|
end;
|
|
end;
|
|
// main
|
|
begin
|
|
AList.Clear;
|
|
FindNodesRecursive(Self, AList);
|
|
end;
|
|
|
|
function TXmlNode.FloatAllowScientific: boolean;
|
|
begin
|
|
if assigned(Document) then
|
|
Result := Document.FloatAllowScientific
|
|
else
|
|
Result := cDefaultFloatAllowScientific;
|
|
end;
|
|
|
|
function TXmlNode.FloatSignificantDigits: integer;
|
|
begin
|
|
if assigned(Document) then
|
|
Result := Document.FloatSignificantDigits
|
|
else
|
|
Result := cDefaultFloatSignificantDigits;
|
|
end;
|
|
|
|
function TXmlNode.FromAnsiString(const s: AnsiString): UTF8String;
|
|
begin
|
|
Result := sdAnsiToUtf8(s)
|
|
end;
|
|
|
|
function TXmlNode.FromUnicodeString(const W: UnicodeString): UTF8String;
|
|
begin
|
|
Result := sdUnicodeToUtf8(W)
|
|
end;
|
|
|
|
function TXmlNode.GetAttributeByName(const AName: UTF8String): UTF8String;
|
|
begin
|
|
if assigned(FAttributes) then
|
|
Result := sdUTF8UnEscapeString(sdUTF8UnQuotedString(FAttributes.Values[AName]))
|
|
else
|
|
Result := '';
|
|
end;
|
|
|
|
function TXmlNode.GetAttributeByNameWide(const AName: UTF8String): UnicodeString;
|
|
begin
|
|
Result := ToUnicodeString(GetAttributeByName(AName));
|
|
end;
|
|
|
|
function TXmlNode.GetAttributeCount: integer;
|
|
begin
|
|
if assigned(FAttributes) then
|
|
Result := FAttributes.Count
|
|
else
|
|
Result := 0;
|
|
end;
|
|
|
|
function TXmlNode.GetAttributeName(Index: integer): UTF8String;
|
|
begin
|
|
if (Index >= 0) and (Index < AttributeCount) then
|
|
Result := FAttributes.Names[Index];
|
|
end;
|
|
|
|
function TXmlNode.GetAttributePair(Index: integer): UTF8String;
|
|
begin
|
|
if (Index >= 0) and (Index < AttributeCount) then
|
|
Result := FAttributes[Index];
|
|
end;
|
|
|
|
function TXmlNode.GetAttributeValue(Index: integer): UTF8String;
|
|
var
|
|
P: integer;
|
|
S: UTF8String;
|
|
begin
|
|
Result := '';
|
|
if (Index >= 0) and (Index < AttributeCount) then
|
|
begin
|
|
S := FAttributes[Index];
|
|
P := Utf8Pos('=', S);
|
|
if P > 0 then
|
|
Result := sdUTF8UnEscapeString(sdUTF8UnQuotedString(Copy(S, P + 1, MaxInt)));
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.GetAttributeValueAsInteger(Index: integer): integer;
|
|
begin
|
|
Result := StrToIntDef(string(GetAttributeValue(Index)), 0);
|
|
end;
|
|
|
|
function TXmlNode.GetAttributeValueAsUnicodeString(Index: integer): UnicodeString;
|
|
begin
|
|
Result := ToUnicodeString(GetAttributeValue(Index));
|
|
end;
|
|
|
|
function TXmlNode.GetAttributeValueDirect(Index: integer): UTF8String;
|
|
var
|
|
P: integer;
|
|
S: UTF8String;
|
|
begin
|
|
Result := '';
|
|
if (Index >= 0) and (Index < AttributeCount) then
|
|
begin
|
|
S := FAttributes[Index];
|
|
P := Utf8Pos('=', S);
|
|
if P > 0 then
|
|
Result := sdUTF8UnQuotedString(Copy(S, P + 1, MaxInt));
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.GetBinaryEncoding: TBinaryEncodingType;
|
|
begin
|
|
Result := xbeBinHex;
|
|
if assigned(Document) then
|
|
Result := Document.BinaryEncoding;
|
|
end;
|
|
|
|
function TXmlNode.GetBinaryString: RawByteString;
|
|
// Get the binary contents of this node as Base64 and return it as a RawByteString
|
|
var
|
|
OldEncoding: TBinaryEncodingType;
|
|
{$IFDEF CLR}
|
|
Buffer: TBytes;
|
|
{$ENDIF}
|
|
begin
|
|
// Set to base64
|
|
OldEncoding := BinaryEncoding;
|
|
try
|
|
BinaryEncoding := xbeBase64;
|
|
{$IFDEF CLR}
|
|
SetLength(Buffer, BufferLength);
|
|
if length(Buffer) > 0 then
|
|
BufferRead(Buffer, length(Buffer));
|
|
Result := Buffer;
|
|
{$ELSE}
|
|
SetLength(Result, BufferLength);
|
|
if length(Result) > 0 then
|
|
BufferRead(Result[1], length(Result));
|
|
{$ENDIF}
|
|
finally
|
|
BinaryEncoding := OldEncoding;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.GetCascadedName: UTF8String;
|
|
// Return the name+index and all predecessors with underscores to separate, in
|
|
// order to get a unique reference that can be used in filenames
|
|
var
|
|
LName: UTF8String;
|
|
begin
|
|
LName := UTF8String(Format('%s%.4d', [Name, StrToIntDef(string(AttributeByName['Index']), 0)]));
|
|
if assigned(Parent) then
|
|
Result := UTF8String(Format('%s_%s', [Parent.CascadedName, LName]))
|
|
else
|
|
Result := LName;
|
|
end;
|
|
|
|
function TXmlNode.GetFullPath: UTF8String;
|
|
// GetFullpath will return the complete path of the node from the root, e.g.
|
|
// /Root/SubNode1/SubNode2/ThisNode
|
|
begin
|
|
Result := '/' + Name;
|
|
if Treedepth > 0 then
|
|
// Recursive call
|
|
Result := Parent.GetFullPath + Result;
|
|
end;
|
|
|
|
function TXmlNode.GetIndent: UTF8String;
|
|
var
|
|
i: integer;
|
|
begin
|
|
if assigned(Document) then
|
|
begin
|
|
case Document.XmlFormat of
|
|
xfCompact: Result := '';
|
|
xfReadable:
|
|
for i := 0 to TreeDepth - 1 do
|
|
Result := Result + Document.IndentString;
|
|
end; //case
|
|
end else
|
|
Result := ''
|
|
end;
|
|
|
|
function TXmlNode.GetLineFeed: UTF8String;
|
|
begin
|
|
if assigned(Document) then
|
|
begin
|
|
case Document.XmlFormat of
|
|
xfCompact: Result := '';
|
|
xfReadable: Result := #13#10;
|
|
else
|
|
Result := #10;
|
|
end; //case
|
|
end else
|
|
Result := '';
|
|
end;
|
|
|
|
function TXmlNode.GetNodeCount: integer;
|
|
begin
|
|
if Assigned(FNodes) then
|
|
Result := FNodes.Count
|
|
else
|
|
Result := 0;
|
|
end;
|
|
|
|
function TXmlNode.GetNodes(Index: integer): TXmlNode;
|
|
begin
|
|
if (Index >= 0) and (Index < NodeCount) then
|
|
Result := TXmlNode(FNodes[Index])
|
|
else
|
|
Result := nil;
|
|
end;
|
|
|
|
function TXmlNode.GetTotalNodeCount: integer;
|
|
var
|
|
i: integer;
|
|
begin
|
|
Result := NodeCount;
|
|
for i := 0 to NodeCount - 1 do
|
|
inc(Result, Nodes[i].TotalNodeCount);
|
|
end;
|
|
|
|
function TXmlNode.GetTreeDepth: integer;
|
|
begin
|
|
Result := -1;
|
|
if assigned(Parent) then
|
|
Result := Parent.TreeDepth + 1;
|
|
end;
|
|
|
|
function TXmlNode.GetValueAsBool: boolean;
|
|
begin
|
|
Result := sdStringToBool(FValue);
|
|
end;
|
|
|
|
function TXmlNode.GetValueAsDateTime: TDateTime;
|
|
begin
|
|
Result := sdDateTimeFromString(ValueAsString, UseLocalBias);
|
|
end;
|
|
|
|
function TXmlNode.GetValueAsFloat: double;
|
|
var
|
|
Code: integer;
|
|
begin
|
|
val(string(sdUTF8StringReplace(FValue, ',', '.')), Result, Code);
|
|
if Code > 0 then
|
|
raise Exception.Create(sxeCannotConvertToFloat);
|
|
end;
|
|
|
|
function TXmlNode.GetValueAsInt64: int64;
|
|
begin
|
|
Result := StrToInt64(string(FValue));
|
|
end;
|
|
|
|
function TXmlNode.GetValueAsInteger: integer;
|
|
begin
|
|
Result := StrToInt(string(FValue));
|
|
end;
|
|
|
|
function TXmlNode.GetValueAsString: UTF8String;
|
|
begin
|
|
if FElementType = xeNormal then
|
|
Result := UnEscapeString(sdUTF8Trim(FValue))
|
|
else
|
|
Result := UnEscapeString(FValue);
|
|
end;
|
|
|
|
function TXmlNode.GetValueAsUnicodeString: UnicodeString;
|
|
begin
|
|
Result := ToUnicodeString(ValueAsString);
|
|
end;
|
|
|
|
function TXmlNode.GetWriteOnDefault: boolean;
|
|
begin
|
|
Result := True;
|
|
if assigned(Document) then
|
|
Result := Document.WriteOnDefault;
|
|
end;
|
|
|
|
function TXmlNode.HasAttribute(const AName: UTF8String): boolean;
|
|
begin
|
|
if assigned(FAttributes) then
|
|
Result := FAttributes.IndexOfName(AName) >= 0
|
|
else
|
|
Result := False;
|
|
end;
|
|
|
|
function TXmlNode.IndexInParent: integer;
|
|
// Retrieve our index in the parent's nodelist
|
|
begin
|
|
Result := -1;
|
|
if assigned(Parent) then
|
|
Result := Parent.FNodes.IndexOf(Self);
|
|
end;
|
|
|
|
function TXmlNode.IsClear: boolean;
|
|
begin
|
|
Result := (Length(FName) = 0) and IsEmpty;
|
|
end;
|
|
|
|
function TXmlNode.IsEmpty: boolean;
|
|
begin
|
|
Result := (Length(FValue) = 0) and (NodeCount = 0) and (AttributeCount = 0);
|
|
end;
|
|
|
|
function TXmlNode.IsEqualTo(ANode: TXmlNode; Options: TXmlCompareOptions;
|
|
MismatchNodes: TList): boolean;
|
|
var
|
|
i, Index: integer;
|
|
NodeResult, ChildResult: boolean;
|
|
begin
|
|
// Start with a negative result
|
|
Result := False;
|
|
NodeResult := False;
|
|
if not assigned(ANode) then
|
|
exit;
|
|
|
|
// Assume childs equals other node's childs
|
|
ChildResult := True;
|
|
|
|
// child node names and values - this comes first to assure the lists are filled
|
|
if (xcChildNames in Options) or (xcChildValues in Options) or (xcRecursive in Options) then
|
|
for i := 0 to NodeCount - 1 do
|
|
begin
|
|
// Do child name check
|
|
Index := ANode.NodeIndexByName(Nodes[i].Name);
|
|
// Do we have the childnode in the other?
|
|
if Index < 0 then
|
|
begin
|
|
// No we dont have it
|
|
if xcChildNames in Options then
|
|
begin
|
|
if assigned(MismatchNodes) then MismatchNodes.Add(Nodes[i]);
|
|
ChildResult := False;
|
|
end;
|
|
end else
|
|
begin
|
|
// Do child value check
|
|
if xcChildValues in Options then
|
|
if UTF8CompareText(Nodes[i].ValueAsString, ANode.Nodes[Index].ValueAsString) <> 0 then
|
|
begin
|
|
if assigned(MismatchNodes) then
|
|
MismatchNodes.Add(Nodes[i]);
|
|
ChildResult := False;
|
|
end;
|
|
// Do recursive check
|
|
if xcRecursive in Options then
|
|
if not Nodes[i].IsEqualTo(ANode.Nodes[Index], Options, MismatchNodes) then
|
|
ChildResult := False;
|
|
end;
|
|
end;
|
|
|
|
try
|
|
// We assume there are differences
|
|
NodeResult := False;
|
|
|
|
// Node name, type and value
|
|
if xcNodeName in Options then
|
|
if UTF8CompareText(Name, ANode.Name) <> 0 then
|
|
exit;
|
|
|
|
if xcNodeType in Options then
|
|
if ElementType <> ANode.ElementType then
|
|
exit;
|
|
|
|
if xcNodeValue in Options then
|
|
if UTF8CompareText(ValueAsString, ANode.ValueAsString) <> 0 then
|
|
exit;
|
|
|
|
// attribute count
|
|
if xcAttribCount in Options then
|
|
if AttributeCount <> ANode.AttributeCount then
|
|
exit;
|
|
|
|
// attribute names and values
|
|
if (xcAttribNames in Options) or (xcAttribValues in Options) then
|
|
for i := 0 to AttributeCount - 1 do
|
|
begin
|
|
Index := ANode.AttributeIndexByName(AttributeName[i]);
|
|
if Index < 0 then
|
|
if xcAttribNames in Options then
|
|
exit
|
|
else
|
|
continue;
|
|
if xcAttribValues in Options then
|
|
if UTF8CompareText(AttributeValue[i], ANode.AttributeValue[Index]) <> 0 then
|
|
exit;
|
|
end;
|
|
|
|
// child node count
|
|
if xcChildCount in Options then
|
|
if NodeCount <> ANode.NodeCount then
|
|
exit;
|
|
|
|
// If we arrive here, it means no differences were found, return True
|
|
NodeResult := True;
|
|
|
|
finally
|
|
|
|
Result := ChildResult and NodeResult;
|
|
if (not NodeResult) and assigned(MismatchNodes) then
|
|
MismatchNodes.Insert(0, Self);
|
|
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.NodeAdd(ANode: TXmlNode): integer;
|
|
begin
|
|
if assigned(ANode) then
|
|
begin
|
|
ANode.Parent := Self;
|
|
ANode.ChangeDocument(Document);
|
|
if not assigned(FNodes) then
|
|
FNodes := TList.Create;
|
|
Result := FNodes.Add(ANode);
|
|
end else
|
|
Result := -1;
|
|
end;
|
|
|
|
function TXmlNode.NodeByAttributeValue(const NodeName, AttribName, AttribValue: UTF8String;
|
|
ShouldRecurse: boolean): TXmlNode;
|
|
// This function returns a pointer to the first subnode that has an attribute with
|
|
// name AttribName and value AttribValue.
|
|
var
|
|
i: integer;
|
|
Node: TXmlNode;
|
|
begin
|
|
Result := nil;
|
|
// Find all nodes that are potential results
|
|
for i := 0 to NodeCount - 1 do
|
|
begin
|
|
Node := Nodes[i];
|
|
if (UTF8CompareText(Node.Name, NodeName) = 0) and
|
|
Node.HasAttribute(AttribName) and
|
|
(UTF8CompareText(Node.AttributeByName[AttribName], AttribValue) = 0) then
|
|
begin
|
|
Result := Node;
|
|
exit;
|
|
end;
|
|
// Recursive call
|
|
if ShouldRecurse then
|
|
Result := Node.NodeByAttributeValue(NodeName, AttribName, AttribValue, True);
|
|
if assigned(Result) then
|
|
exit;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.NodeByElementType(ElementType: TXmlElementType): TXmlNode;
|
|
var
|
|
i: integer;
|
|
begin
|
|
Result := nil;
|
|
for i := 0 to NodeCount - 1 do
|
|
if Nodes[i].ElementType = ElementType then
|
|
begin
|
|
Result := Nodes[i];
|
|
exit;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.NodeByName(const AName: UTF8String): TXmlNode;
|
|
var
|
|
i: integer;
|
|
begin
|
|
Result := nil;
|
|
for i := 0 to NodeCount - 1 do
|
|
if UTF8CompareText(Nodes[i].Name, AName) = 0 then
|
|
begin
|
|
Result := Nodes[i];
|
|
exit;
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.NodeDelete(Index: integer);
|
|
begin
|
|
if (Index >= 0) and (Index < NodeCount) then
|
|
begin
|
|
TXmlNode(FNodes[Index]).Free;
|
|
FNodes.Delete(Index);
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.NodeExchange(Index1, Index2: integer);
|
|
begin
|
|
if (Index1 >= 0) and (Index1 < Nodecount) and
|
|
(Index2 >= 0) and (Index2 < Nodecount) then
|
|
FNodes.Exchange(Index1, Index2);
|
|
end;
|
|
|
|
function TXmlNode.NodeExtract(ANode: TXmlNode): TXmlNode;
|
|
var
|
|
Index: integer;
|
|
begin
|
|
// Compatibility with Delphi4
|
|
Result := nil;
|
|
if assigned(FNodes) then
|
|
begin
|
|
Index := FNodes.IndexOf(ANode);
|
|
if Index >= 0 then begin
|
|
Result := ANode;
|
|
FNodes.Delete(Index);
|
|
end;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.NodeFindOrCreate(const AName: UTF8String): TXmlNode;
|
|
// Find the node with AName, and if not found, add new one
|
|
begin
|
|
Result := NodeByName(AName);
|
|
if not assigned(Result) then
|
|
Result := NodeNew(AName);
|
|
end;
|
|
|
|
function TXmlNode.NodeIndexByName(const AName: UTF8String): integer;
|
|
begin
|
|
Result := 0;
|
|
while Result < NodeCount do
|
|
begin
|
|
if UTF8CompareText(Nodes[Result].Name, AName) = 0 then
|
|
exit;
|
|
inc(Result);
|
|
end;
|
|
if Result = NodeCount then
|
|
Result := -1;
|
|
end;
|
|
|
|
function TXmlNode.NodeIndexByNameFrom(const AName: UTF8String; AFrom: integer): integer;
|
|
begin
|
|
Result := AFrom;
|
|
while Result < NodeCount do
|
|
begin
|
|
if UTF8CompareText(Nodes[Result].Name, AName) = 0 then
|
|
exit;
|
|
inc(Result);
|
|
end;
|
|
if Result = NodeCount then
|
|
Result := -1;
|
|
end;
|
|
|
|
function TXmlNode.NodeIndexOf(ANode: TXmlNode): integer;
|
|
begin
|
|
if assigned(ANode) and assigned(FNodes) then
|
|
Result := FNodes.IndexOf(ANode)
|
|
else
|
|
Result := -1;
|
|
end;
|
|
|
|
procedure TXmlNode.NodeInsert(Index: integer; ANode: TXmlNode);
|
|
// Insert the node ANode at location Index in the list.
|
|
begin
|
|
if not assigned(ANode) then
|
|
exit;
|
|
if (Index >=0) and (Index <= NodeCount) then
|
|
begin
|
|
if not assigned(FNodes) then
|
|
FNodes := TList.Create;
|
|
ANode.Parent := Self;
|
|
FNodes.Insert(Index, ANode);
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.NodeNew(const AName: UTF8String): TXmlNode;
|
|
// Add a new child node and return its pointer
|
|
begin
|
|
Result := Nodes[NodeAdd(TXmlNode.CreateName(Document, AName))];
|
|
end;
|
|
|
|
function TXmlNode.NodeNewAtIndex(Index: integer; const AName: UTF8String): TXmlNode;
|
|
// Create a new node with AName, and insert it into the subnode list at location
|
|
// Index, and return a pointer to it.
|
|
begin
|
|
if (Index >= 0) and (Index <= NodeCount) then
|
|
begin
|
|
Result := TXmlNode.CreateName(Document, AName);
|
|
NodeInsert(Index, Result);
|
|
end else
|
|
Result := nil;
|
|
end;
|
|
|
|
function TXmlNode.NodeRemove(ANode: TxmlNode): integer;
|
|
begin
|
|
Result := NodeIndexOf(ANode);
|
|
if Result >= 0 then
|
|
NodeDelete(Result);
|
|
end;
|
|
|
|
procedure TXmlNode.NodesByName(const AName: UTF8String; const AList: TList);
|
|
// Fill AList with nodes that have name AName
|
|
var
|
|
i: integer;
|
|
begin
|
|
if not assigned(AList) then
|
|
exit;
|
|
AList.Clear;
|
|
for i := 0 to NodeCount - 1 do
|
|
if UTF8CompareText(Nodes[i].Name, AName) = 0 then
|
|
AList.Add(Nodes[i]);
|
|
end;
|
|
|
|
procedure TXmlNode.NodesClear;
|
|
var
|
|
i: integer;
|
|
begin
|
|
for i := 0 to NodeCount - 1 do
|
|
TXmlNode(FNodes[i]).Free;
|
|
FreeAndNil(FNodes);
|
|
end;
|
|
|
|
procedure TXmlNode.ParseTag(const AValue: UTF8String; TagStart, TagClose: integer);
|
|
var
|
|
LItems: TsdUTF8StringList;
|
|
begin
|
|
// Create a list to hold string items
|
|
LItems := TsdUTF8StringList.Create;
|
|
try
|
|
sdUTF8ParseAttributes(AValue, TagStart, TagClose, LItems);
|
|
|
|
// Determine name, attributes or value for each element type
|
|
case ElementType of
|
|
xeDeclaration:
|
|
FName := 'xml';
|
|
xeStyleSheet:
|
|
begin
|
|
FName := 'xml-stylesheet';
|
|
// We also set this as the value for use in "StyleSheetString"
|
|
ValueDirect := sdUTF8Trim(copy(AValue, TagStart, TagClose - TagStart));
|
|
end;
|
|
else
|
|
// First item is the name - is it there?
|
|
if LItems.Count = 0 then
|
|
raise EFilerError.Create(sxeMissingElementName);
|
|
|
|
// Set the name - using the element instead of property for speed
|
|
FName := LItems[0];
|
|
LItems.Delete(0);
|
|
end;//case
|
|
|
|
// Any attributes?
|
|
if LItems.Count > 0 then
|
|
begin
|
|
CheckCreateAttributesList;
|
|
FAttributes.Assign(LItems);
|
|
end;
|
|
|
|
finally
|
|
LItems.Free;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.QualifyAsDirectNode: boolean;
|
|
// If this node qualifies as a direct node when writing, we return True.
|
|
// A direct node may have attributes, but no value or subnodes. Furhtermore,
|
|
// the root node will never be displayed as a direct node.
|
|
begin
|
|
Result :=
|
|
(Length(FValue) = 0) and
|
|
(NodeCount = 0) and
|
|
(ElementType = xeNormal) and
|
|
not UseFullNodes and
|
|
(TreeDepth > 0);
|
|
end;
|
|
|
|
function TXmlNode.ReadAttributeBool(const AName: UTF8String; ADefault: boolean): boolean;
|
|
var
|
|
V: UTF8String;
|
|
begin
|
|
Result := ADefault;
|
|
V := AttributeByName[AName];
|
|
if Length(V) = 0 then
|
|
exit;
|
|
|
|
try
|
|
Result := sdStringToBool(V);
|
|
except
|
|
Result := ADefault;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.ReadAttributeDateTime(const AName: UTF8String; ADefault: TDateTime): TDateTime;
|
|
var
|
|
V: UTF8String;
|
|
begin
|
|
Result := ADefault;
|
|
V := AttributeByName[AName];
|
|
if Length(V) = 0 then
|
|
exit;
|
|
|
|
try
|
|
Result := sdDateTimeFromStringDefault(V, ADefault, UseLocalBias);
|
|
except
|
|
Result := ADefault;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.ReadAttributeFloat(const AName: UTF8String; ADefault: double): double;
|
|
var
|
|
V: UTF8String;
|
|
Code: integer;
|
|
begin
|
|
V := AttributeByName[AName];
|
|
val(string(sdUTF8StringReplace(V, ',', '.')), Result, Code);
|
|
if Code > 0 then
|
|
Result := ADefault;
|
|
end;
|
|
|
|
function TXmlNode.ReadAttributeInteger(const AName: UTF8String; ADefault: integer): integer;
|
|
begin
|
|
Result := StrToIntDef(string(AttributeByName[AName]), ADefault);
|
|
end;
|
|
|
|
function TXmlNode.ReadAttributeInt64(const AName: UTF8String; ADefault: int64): int64;
|
|
begin
|
|
Result := StrToInt64Def(string(AttributeByName[AName]), ADefault);
|
|
end;
|
|
|
|
function TXmlNode.ReadAttributeString(const AName: UTF8String; const ADefault: UTF8String): UTF8String;
|
|
begin
|
|
Result := AttributeByName[AName];
|
|
if length(Result) = 0 then
|
|
Result := ADefault;
|
|
end;
|
|
|
|
function TXmlNode.ReadBool(const AName: UTF8String; ADefault: boolean): boolean;
|
|
var
|
|
Index: integer;
|
|
begin
|
|
Result := ADefault;
|
|
Index := NodeIndexByName(AName);
|
|
if Index >= 0 then
|
|
Result := Nodes[Index].ValueAsBoolDef(ADefault);
|
|
end;
|
|
|
|
{$IFDEF USEGRAPHICS}
|
|
procedure TXmlNode.ReadBrush(const AName: UTF8String; ABrush: TBrush);
|
|
var
|
|
Child: TXmlNode;
|
|
begin
|
|
Child := NodeByName(AName);
|
|
if assigned(Child) then with Child do
|
|
begin
|
|
// Read values
|
|
ABrush.Color := ReadColor('Color', clWhite);
|
|
ABrush.Style := TBrushStyle(ReadInteger('Style', integer(bsSolid)));
|
|
end else
|
|
begin
|
|
// Defaults
|
|
ABrush.Bitmap := nil;
|
|
ABrush.Color := clWhite;
|
|
ABrush.Style := bsSolid;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.ReadColor(const AName: UTF8String; ADefault: TColor): TColor;
|
|
var
|
|
Index: integer;
|
|
begin
|
|
Result := ADefault;
|
|
Index := NodeIndexByName(AName);
|
|
if Index >= 0 then
|
|
Result := StrToInt(string(Nodes[Index].ValueAsString));
|
|
end;
|
|
{$ENDIF}
|
|
|
|
function TXmlNode.ReadDateTime(const AName: UTF8String; ADefault: TDateTime): TDateTime;
|
|
// Date MUST always be written in this format:
|
|
// YYYY-MM-DD (if just date) or
|
|
// YYYY-MM-DDThh:mm:ss.sssZ (if date and time. The Z stands for universal time
|
|
// zone. Since Delphi's TDateTime does not give us a clue about the timezone,
|
|
// this is the easiest solution)
|
|
// This format SHOULD NOT be changed, to avoid all kinds of
|
|
// conversion errors in future.
|
|
// This format is compatible with the W3C date/time specification as found here:
|
|
// http://www.w3.org/TR/NOTE-datetime
|
|
begin
|
|
Result := sdDateTimeFromStringDefault(ReadString(AName, ''), ADefault, UseLocalBias);
|
|
end;
|
|
|
|
function TXmlNode.ReadFloat(const AName: UTF8String; ADefault: double): double;
|
|
var
|
|
Index: integer;
|
|
begin
|
|
Result := ADefault;
|
|
Index := NodeIndexByName(AName);
|
|
if Index >= 0 then
|
|
Result := Nodes[Index].ValueAsFloatDef(ADefault);
|
|
end;
|
|
|
|
{$IFDEF USEGRAPHICS}
|
|
procedure TXmlNode.ReadFont(const AName: UTF8String; AFont: TFont);
|
|
var
|
|
Child: TXmlNode;
|
|
begin
|
|
Child := NodeByName(AName);
|
|
AFont.Style := [];
|
|
if assigned(Child) then with Child do
|
|
begin
|
|
// Read values
|
|
AFont.Name := string(ReadString('Name', 'Arial'));
|
|
AFont.Color := ReadColor('Color', clBlack);
|
|
AFont.Size := ReadInteger('Size', 14);
|
|
if ReadBool('Bold', False) then AFont.Style := AFont.Style + [fsBold];
|
|
if ReadBool('Italic', False) then AFont.Style := AFont.Style + [fsItalic];
|
|
if ReadBool('Underline', False) then AFont.Style := AFont.Style + [fsUnderline];
|
|
if ReadBool('Strikeout', False) then AFont.Style := AFont.Style + [fsStrikeout];
|
|
end else
|
|
begin
|
|
// Defaults
|
|
AFont.Name := 'Arial';
|
|
AFont.Color := clBlack;
|
|
AFont.Size := 14;
|
|
end;
|
|
end;
|
|
{$ENDIF}
|
|
|
|
procedure TXmlNode.ReadFromStream(S: TStream);
|
|
// Read the node from the starting "<" until the closing ">" from the stream in S.
|
|
// This procedure also calls OnNodeNew and OnNodeLoaded events
|
|
var
|
|
Ch: AnsiChar;
|
|
i: integer;
|
|
TagIndex: integer;
|
|
V: UTF8String;
|
|
Len: integer;
|
|
Node: TXmlNode;
|
|
NodeValue: UTF8String;
|
|
ValuePos, ValueLen: integer;
|
|
ClosePos: integer;
|
|
HasCR: boolean;
|
|
HasSubtags: boolean;
|
|
Words: TsdUTF8StringList;
|
|
IsDirect: boolean;
|
|
Reader: TsdSurplusReader;
|
|
// local
|
|
procedure AddCharDataNode(PreserveWhiteSpace: boolean);
|
|
var
|
|
V: UTF8String;
|
|
Node: TXmlNode;
|
|
L: integer;
|
|
begin
|
|
// Add all text up till now as xeCharData
|
|
if ValuePos > 0 then
|
|
begin
|
|
V := copy(NodeValue, 1, ValuePos);
|
|
|
|
if PreserveWhiteSpace then
|
|
L := length(V)
|
|
else
|
|
L := length(sdUTF8Trim(V));
|
|
|
|
if L > 0 then
|
|
begin
|
|
Node := TXmlNode.CreateType(Document, xeCharData);
|
|
Node.ValueDirect := V;
|
|
NodeAdd(Node);
|
|
end;
|
|
ValuePos := 0;
|
|
end;
|
|
end;
|
|
// Main
|
|
begin
|
|
// Check if we aborted parsing
|
|
if AbortParsing then
|
|
exit;
|
|
// Clear this node first
|
|
Clear;
|
|
// Initial reserve textual value: just 80 AnsiCharacters which is OK for most short values
|
|
ValuePos := 0;
|
|
ValueLen := 80;
|
|
SetLength(NodeValue, ValueLen);
|
|
HasCR := False;
|
|
HasSubTags := False;
|
|
Reader := TsdSurplusReader.Create(S);
|
|
try
|
|
// Trailing blanks/controls AnsiChars?
|
|
if not Reader.ReadCharSkipBlanks(Ch) then
|
|
exit;
|
|
|
|
// What is it?
|
|
if Ch = '<' then
|
|
begin
|
|
// A tag - which one?
|
|
TagIndex := ReadOpenTag(Reader);
|
|
if TagIndex >= 0 then
|
|
begin
|
|
try
|
|
ElementType := cTags[TagIndex].Style;
|
|
case ElementType of
|
|
xeNormal, xeDeclaration, xeStyleSheet:
|
|
begin
|
|
// These tags we will process
|
|
ReadStringFromStreamUntil(Reader, cTags[TagIndex].Close, V, True);
|
|
Len := length(V);
|
|
|
|
// Is it a direct tag?
|
|
IsDirect := False;
|
|
if (ElementType = xeNormal) and (Len > 0) then
|
|
if V[Len] = '/' then
|
|
begin
|
|
dec(Len);
|
|
IsDirect := True;
|
|
end;
|
|
ParseTag(V, 1, Len + 1);
|
|
|
|
// Here we know our name so good place to call OnNodeNew event
|
|
if assigned(Document) then
|
|
begin
|
|
Document.DoNodeNew(Self);
|
|
if AbortParsing then
|
|
exit;
|
|
end;
|
|
|
|
// Now the tag can be a direct close - in that case we're finished
|
|
if IsDirect or (ElementType in [xeDeclaration, xeStyleSheet]) then
|
|
exit;
|
|
|
|
// Process rest of tag
|
|
repeat
|
|
|
|
// Read AnsiCharacter from stream
|
|
if S.Read(Ch, 1) <> 1 then
|
|
raise EFilerError.CreateFmt(sxeMissingCloseTag, [Name]);
|
|
|
|
// Is there a subtag?
|
|
if Ch = '<' then
|
|
begin
|
|
if not Reader.ReadCharSkipBlanks(Ch) then
|
|
raise EFilerError.CreateFmt(sxeMissingDataAfterGreaterThan, [Name]);
|
|
if Ch = '/' then
|
|
begin
|
|
|
|
// This seems our closing tag
|
|
if not ReadStringFromStreamUntil(Reader, '>', V, True) then
|
|
raise EFilerError.CreateFmt(sxeMissingLessThanInCloseTag, [Name]);
|
|
if UTF8CompareText(sdUTF8Trim(V), Name) <> 0 then
|
|
raise EFilerError.CreateFmt(sxeIncorrectCloseTag, [Name]);
|
|
V := '';
|
|
break;
|
|
|
|
end else
|
|
begin
|
|
|
|
// Add all text up till now as xeCharData
|
|
AddCharDataNode(False);
|
|
|
|
// Reset the HasCR flag if we add node, we only want to detect
|
|
// the CR after last subnode
|
|
HasCR := False;
|
|
|
|
// This is a subtag... so create it and let it process
|
|
HasSubTags := True;
|
|
S.Seek(-2, soCurrent);
|
|
Node := TXmlNode.Create(Document);
|
|
NodeAdd(Node);
|
|
Node.ReadFromStream(S);
|
|
|
|
// Check for dropping comments
|
|
if assigned(Document) and Document.DropCommentsOnParse and
|
|
(Node.ElementType = xeComment) then
|
|
NodeDelete(NodeIndexOf(Node));
|
|
|
|
end;
|
|
end else
|
|
begin
|
|
|
|
// If we detect a CR we will set the flag. This will signal the fact
|
|
// that this XML file was saved with xfReadable
|
|
if Ch = #13 then
|
|
HasCR := True;
|
|
|
|
// Add the AnsiCharacter to the node value buffer.
|
|
inc(ValuePos);
|
|
if ValuePos > ValueLen then
|
|
begin
|
|
inc(ValueLen, cNodeValueBuf);
|
|
SetLength(NodeValue, ValueLen);
|
|
end;
|
|
NodeValue[ValuePos] := Ch;
|
|
|
|
end;
|
|
until False or AbortParsing;
|
|
|
|
// Add all text up till now as xeText
|
|
AddCharDataNode(not HasSubtags);
|
|
|
|
// Check AnsiCharData nodes, remove trailing CRLF + indentation if we
|
|
// were in xfReadable mode
|
|
if HasSubtags and HasCR then
|
|
begin
|
|
for i := 0 to NodeCount - 1 do
|
|
if Nodes[i].ElementType = xeCharData then
|
|
begin
|
|
ClosePos := length(Nodes[i].FValue);
|
|
while (ClosePos > 0) and (Nodes[i].FValue[ClosePos] in [#10, #13, ' ']) do
|
|
dec(ClosePos);
|
|
Nodes[i].FValue := copy(Nodes[i].FValue, 1, ClosePos);
|
|
end;
|
|
end;
|
|
|
|
// If the first node is xeCharData we use it as ValueDirect
|
|
if NodeCount > 0 then
|
|
if Nodes[0].ElementType = xeCharData then
|
|
begin
|
|
ValueDirect := Nodes[0].ValueDirect;
|
|
NodeDelete(0);
|
|
end;
|
|
|
|
end;
|
|
xeDocType:
|
|
begin
|
|
Name := 'DTD';
|
|
if assigned(Document) then
|
|
begin
|
|
Document.DoNodeNew(Self);
|
|
if AbortParsing then
|
|
exit;
|
|
end;
|
|
// Parse DTD
|
|
if assigned(Document) then
|
|
Document.ParseDTD(Self, S);
|
|
end;
|
|
xeElement, xeAttList, xeEntity, xeNotation:
|
|
begin
|
|
// DTD elements
|
|
ReadStringFromStreamWithQuotes(S, cTags[TagIndex].Close, V);
|
|
Len := length(V);
|
|
Words := TsdUTF8StringList.Create;
|
|
try
|
|
sdUTF8ParseAttributes(V, 1, Len + 1, Words);
|
|
if Words.Count > 0 then
|
|
begin
|
|
Name := Words[0];
|
|
Words.Delete(0);
|
|
end;
|
|
ValueDirect := sdUTF8Trim(Words.Text);
|
|
finally
|
|
Words.Free;
|
|
end;
|
|
if assigned(Document) then
|
|
begin
|
|
Document.DoNodeNew(Self);
|
|
if AbortParsing then
|
|
exit;
|
|
end;
|
|
end;
|
|
else
|
|
case ElementType of
|
|
xeComment: Name := 'Comment';
|
|
xeCData: Name := 'CData';
|
|
xeExclam: Name := 'Special';
|
|
xeQuestion: Name := 'Special';
|
|
else
|
|
Name := 'Unknown';
|
|
end; //case
|
|
|
|
// Here we know our name so good place to call OnNodeNew
|
|
if assigned(Document) then
|
|
begin
|
|
Document.DoNodeNew(Self);
|
|
if AbortParsing then
|
|
exit;
|
|
end;
|
|
|
|
// In these cases just get all data up till the closing tag
|
|
ReadStringFromStreamUntil(Reader, cTags[TagIndex].Close, V, False);
|
|
ValueDirect := V;
|
|
end;//case
|
|
finally
|
|
// Call the OnNodeLoaded and OnProgress events
|
|
if assigned(Document) and not AbortParsing then
|
|
begin
|
|
Document.DoProgress(S.Position);
|
|
Document.DoNodeLoaded(Self);
|
|
end;
|
|
end;
|
|
end;
|
|
end;
|
|
finally
|
|
Reader.Free;
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.ReadFromString(const AValue: UTF8String);
|
|
var
|
|
S: TStream;
|
|
begin
|
|
S := TsdUTF8StringStream.Create(AValue);
|
|
try
|
|
ReadFromStream(S);
|
|
finally
|
|
S.Free;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.ReadInt64(const AName: UTF8String; ADefault: int64): int64;
|
|
var
|
|
Index: integer;
|
|
begin
|
|
Result := ADefault;
|
|
Index := NodeIndexByName(AName);
|
|
if Index >= 0 then
|
|
Result := Nodes[Index].ValueAsInt64Def(ADefault);
|
|
end;
|
|
|
|
function TXmlNode.ReadInteger(const AName: UTF8String; ADefault: integer): integer;
|
|
var
|
|
Index: integer;
|
|
begin
|
|
Result := ADefault;
|
|
Index := NodeIndexByName(AName);
|
|
if Index >= 0 then
|
|
Result := Nodes[Index].ValueAsIntegerDef(ADefault);
|
|
end;
|
|
|
|
{$IFDEF USEGRAPHICS}
|
|
procedure TXmlNode.ReadPen(const AName: UTF8String; APen: TPen);
|
|
var
|
|
Child: TXmlNode;
|
|
begin
|
|
Child := NodeByName(AName);
|
|
if assigned(Child) then with Child do
|
|
begin
|
|
// Read values
|
|
APen.Color := ReadColor('Color', clBlack);
|
|
APen.Mode := TPenMode(ReadInteger('Mode', integer(pmCopy)));
|
|
APen.Style := TPenStyle(ReadInteger('Style', integer(psSolid)));
|
|
APen.Width := ReadInteger('Width', 1);
|
|
end else
|
|
begin
|
|
// Defaults
|
|
APen.Color := clBlack;
|
|
APen.Mode := pmCopy;
|
|
APen.Style := psSolid;
|
|
APen.Width := 1;
|
|
end;
|
|
end;
|
|
{$ENDIF}
|
|
|
|
function TXmlNode.ReadString(const AName: UTF8String; const ADefault: UTF8String): UTF8String;
|
|
var
|
|
Index: integer;
|
|
begin
|
|
Result := ADefault;
|
|
Index := NodeIndexByName(AName);
|
|
if Index >= 0 then
|
|
Result := Nodes[Index].ValueAsString;
|
|
end;
|
|
|
|
function TXmlNode.ReadUnicodeString(const AName: UTF8String; const ADefault: UnicodeString): UnicodeString;
|
|
begin
|
|
Result := ToUnicodeString(ReadString(AName, FromUnicodeString(ADefault)));
|
|
end;
|
|
|
|
procedure TXmlNode.ResolveEntityReferences;
|
|
// Replace any entity references by the entities, and parse the new content if any
|
|
// local
|
|
function SplitReference(const AValue: UTF8String; var Text1, Text2: UTF8String): UTF8String;
|
|
var
|
|
P: integer;
|
|
begin
|
|
Result := '';
|
|
P := UTF8Pos('&', AValue);
|
|
Text1 := '';
|
|
Text2 := AValue;
|
|
if P = 0 then
|
|
exit;
|
|
Text1 := copy(AValue, 1, P - 1);
|
|
Text2 := copy(AValue, P + 1, length(AValue));
|
|
P := UTF8Pos(';', Text2);
|
|
if P = 0 then
|
|
exit;
|
|
Result := copy(Text2, 1, P - 1);
|
|
Text2 := copy(Text2, P + 1, length(Text2));
|
|
end;
|
|
// local
|
|
function ReplaceEntityReferenceByNodes(ARoot: TXmlNode; const AValue: UTF8String; var InsertPos: integer; var Text1, Text2: UTF8String): boolean;
|
|
var
|
|
Reference: UTF8String;
|
|
Entity: UTF8String;
|
|
Node: TXmlNode;
|
|
S: TStream;
|
|
begin
|
|
Result := False;
|
|
Reference := SplitReference(AValue, Text1, Text2);
|
|
if (length(Reference) = 0) or not assigned(Document) then
|
|
exit;
|
|
|
|
// Lookup entity references
|
|
Entity := Document.EntityByName[Reference];
|
|
|
|
// Does the entity contain markup?
|
|
if (length(Entity) > 0) and (UTF8Pos('<', Entity) > 0) then
|
|
begin
|
|
S := TsdUTF8StringStream.Create(Entity);
|
|
try
|
|
while S.Position < S.Size do
|
|
begin
|
|
Node := TXmlNode.Create(Document);
|
|
Node.ReadFromStream(S);
|
|
if Node.IsEmpty then
|
|
Node.Free
|
|
else
|
|
begin
|
|
ARoot.NodeInsert(InsertPos, Node);
|
|
inc(InsertPos);
|
|
Result := True;
|
|
end;
|
|
end;
|
|
finally
|
|
S.Free;
|
|
end;
|
|
end;
|
|
end;
|
|
// main
|
|
var
|
|
i: integer;
|
|
InsertPos: integer;
|
|
Text1, Text2: UTF8String;
|
|
Node: TXmlNode;
|
|
V, Reference, Replace, Entity, First, Last: UTF8String;
|
|
begin
|
|
if length(FValue) > 0 then
|
|
begin
|
|
// Different behaviour for xeNormal and xeCharData
|
|
if ElementType = xeNormal then
|
|
begin
|
|
InsertPos := 0;
|
|
if ReplaceEntityReferenceByNodes(Self, FValue, InsertPos, Text1, Text2) then
|
|
begin
|
|
FValue := Text1;
|
|
if length(sdUTF8Trim(Text2)) > 0 then
|
|
begin
|
|
Node := TXmlNode.CreateType(Document, xeCharData);
|
|
Node.ValueDirect := Text2;
|
|
NodeInsert(InsertPos, Node);
|
|
end;
|
|
end;
|
|
end else if (ElementType = xeCharData) and assigned(Parent) then
|
|
begin
|
|
InsertPos := Parent.NodeIndexOf(Self);
|
|
if ReplaceEntityReferenceByNodes(Parent, FValue, InsertPos, Text1, Text2) then
|
|
begin
|
|
FValue := Text1;
|
|
if length(sdUTF8Trim(FValue)) = 0 then
|
|
FValue := '';
|
|
if length(sdUTF8Trim(Text2)) > 0 then
|
|
begin
|
|
Node := TXmlNode.CreateType(Document, xeCharData);
|
|
Node.ValueDirect := Text2;
|
|
Parent.NodeInsert(InsertPos, Node);
|
|
end;
|
|
end;
|
|
end;
|
|
end;
|
|
|
|
// Do attributes
|
|
for i := 0 to AttributeCount - 1 do
|
|
begin
|
|
Last := AttributeValue[i];
|
|
V := '';
|
|
repeat
|
|
Reference := SplitReference(Last, First, Last);
|
|
Replace := '';
|
|
if length(Reference) > 0 then
|
|
begin
|
|
Entity := Document.EntityByName[Reference];
|
|
if length(Entity) > 0 then
|
|
Replace := Entity
|
|
else
|
|
Replace := '&' + Reference + ';';
|
|
end;
|
|
V := V + First + Replace;
|
|
until length(Reference) = 0;
|
|
V := V + Last;
|
|
AttributeValue[i] := V;
|
|
end;
|
|
|
|
// Do childnodes too
|
|
i := 0;
|
|
while i < NodeCount do
|
|
begin
|
|
Nodes[i].ResolveEntityReferences;
|
|
inc(i);
|
|
end;
|
|
|
|
// Check for empty AnsiCharData nodes
|
|
for i := NodeCount - 1 downto 0 do
|
|
if (Nodes[i].ElementType = xeCharData) and (length(Nodes[i].ValueDirect) = 0) then
|
|
NodeDelete(i);
|
|
end;
|
|
|
|
procedure TXmlNode.SetAttributeByName(const AName, Value: UTF8String);
|
|
begin
|
|
CheckCreateAttributesList;
|
|
FAttributes.Values[AName] := sdUTF8QuotedString(sdUTF8EscapeString(Value));
|
|
end;
|
|
|
|
procedure TXmlNode.SetAttributeByNameWide(const AName: UTF8String; const Value: UnicodeString);
|
|
begin
|
|
SetAttributeByName(AName, FromUnicodeString(Value));
|
|
end;
|
|
|
|
procedure TXmlNode.SetAttributeName(Index: integer; const Value: UTF8String);
|
|
var
|
|
S: UTF8String;
|
|
P: integer;
|
|
begin
|
|
if (Index >= 0) and (Index < AttributeCount) then
|
|
begin
|
|
S := FAttributes[Index];
|
|
P := Utf8Pos('=', S);
|
|
if P > 0 then
|
|
FAttributes[Index] := Value + '=' + Copy(S, P + 1, MaxInt);
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.SetAttributeValue(Index: integer; const Value: UTF8String);
|
|
begin
|
|
if (Index >= 0) and (Index < AttributeCount) then
|
|
FAttributes[Index] := AttributeName[Index] + '=' +
|
|
sdUTF8QuotedString(sdUTF8EscapeString(Value));
|
|
end;
|
|
|
|
procedure TXmlNode.SetAttributeValueAsInteger(Index: integer; const Value: integer);
|
|
begin
|
|
SetAttributeValue(Index, IntToUTF8Str(Value));
|
|
end;
|
|
|
|
procedure TXmlNode.SetAttributeValueAsUnicodeString(Index: integer;
|
|
const Value: UnicodeString);
|
|
begin
|
|
SetAttributeValue(Index, FromUnicodeString(Value));
|
|
end;
|
|
|
|
procedure TXmlNode.SetAttributeValueDirect(Index: integer; const Value: UTF8String);
|
|
begin
|
|
if (Index >= 0) and (Index < AttributeCount) then
|
|
FAttributes[Index] := AttributeName[Index] + '=' +
|
|
sdUTF8QuotedString(Value);
|
|
end;
|
|
|
|
procedure TXmlNode.SetBinaryEncoding(const Value: TBinaryEncodingType);
|
|
begin
|
|
if assigned(Document) then
|
|
Document.BinaryEncoding := Value;
|
|
end;
|
|
|
|
procedure TXmlNode.SetBinaryString(const Value: RawByteString);
|
|
var
|
|
OldEncoding: TBinaryEncodingType;
|
|
begin
|
|
// Set to base64
|
|
OldEncoding := BinaryEncoding;
|
|
try
|
|
BinaryEncoding := xbeBase64;
|
|
if length(Value) = 0 then
|
|
begin
|
|
ValueAsString := '';
|
|
exit;
|
|
end;
|
|
// fill the buffer
|
|
{$IFDEF CLR}
|
|
BufferWrite(BytesOf(Value), length(Value));
|
|
{$ELSE}
|
|
BufferWrite(Value[1], length(Value));
|
|
{$ENDIF}
|
|
finally
|
|
BinaryEncoding := OldEncoding;
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.SetName(const Value: UTF8String);
|
|
var
|
|
i: integer;
|
|
begin
|
|
if FName <> Value then
|
|
begin
|
|
// Check if the name abides the rules. We will be very forgiving here and
|
|
// just accept any name that at least does not contain control AnsiCharacters
|
|
for i := 1 to length(Value) do
|
|
if Value[i] in cControlChars then
|
|
raise Exception.Create(Format(sxeIllegalCharInNodeName, [Value]));
|
|
FName := Value;
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.SetValueAsBool(const Value: boolean);
|
|
begin
|
|
FValue := sdStringFromBool(Value);
|
|
end;
|
|
|
|
procedure TXmlNode.SetValueAsDateTime(const Value: TDateTime);
|
|
begin
|
|
ValueAsString := sdDateTimeToString(Value, UseLocalBias);
|
|
end;
|
|
|
|
procedure TXmlNode.SetValueAsFloat(const Value: double);
|
|
begin
|
|
FValue := sdWriteNumber(Value, FloatSignificantDigits, FloatAllowScientific);
|
|
end;
|
|
|
|
procedure TXmlNode.SetValueAsInt64(const Value: int64);
|
|
begin
|
|
FValue := Int64ToUTF8Str(Value);
|
|
end;
|
|
|
|
procedure TXmlNode.SetValueAsInteger(const Value: integer);
|
|
begin
|
|
FValue := IntToUTF8Str(Value);
|
|
end;
|
|
|
|
procedure TXmlNode.SetValueAsString(const AValue: UTF8String);
|
|
begin
|
|
FValue := sdUTF8EscapeString(AValue);
|
|
end;
|
|
|
|
procedure TXmlNode.SetValueAsUnicodeString(const Value: UnicodeString);
|
|
begin
|
|
ValueAsString := FromUnicodeString(Value);
|
|
end;
|
|
|
|
procedure TXmlNode.SortChildNodes(Compare: TXMLNodeCompareFunction; Info: TPointer);
|
|
// Sort the child nodes using the quicksort algorithm
|
|
//local
|
|
function DoNodeCompare(Node1, Node2: TXmlNode): integer;
|
|
begin
|
|
if assigned(Compare) then
|
|
Result := Compare(Node1, Node2, Info)
|
|
else
|
|
if assigned(Document) and assigned(Document.OnNodeCompare) then
|
|
Result := Document.OnNodeCompare(Document, Node1, Node2, Info)
|
|
else
|
|
Result := UTF8CompareText(Node1.Name, Node2.Name);
|
|
end;
|
|
// local
|
|
procedure QuickSort(iLo, iHi: Integer);
|
|
var
|
|
Lo, Hi, Mid: longint;
|
|
begin
|
|
Lo := iLo;
|
|
Hi := iHi;
|
|
Mid:= (Lo + Hi) div 2;
|
|
repeat
|
|
while DoNodeCompare(Nodes[Lo], Nodes[Mid]) < 0 do
|
|
Inc(Lo);
|
|
while DoNodeCompare(Nodes[Hi], Nodes[Mid]) > 0 do
|
|
Dec(Hi);
|
|
if Lo <= Hi then
|
|
begin
|
|
// Swap pointers;
|
|
NodeExchange(Lo, Hi);
|
|
if Mid = Lo then
|
|
Mid := Hi
|
|
else
|
|
if Mid = Hi then
|
|
Mid := Lo;
|
|
Inc(Lo);
|
|
Dec(Hi);
|
|
end;
|
|
until Lo > Hi;
|
|
if Hi > iLo then
|
|
QuickSort(iLo, Hi);
|
|
if Lo < iHi then
|
|
QuickSort(Lo, iHi);
|
|
end;
|
|
// main
|
|
begin
|
|
if NodeCount > 1 then
|
|
QuickSort(0, NodeCount - 1);
|
|
end;
|
|
|
|
function TXmlNode.ToUnicodeString(const s: UTF8String): UnicodeString;
|
|
begin
|
|
Result := sdUtf8ToUnicode(s)
|
|
end;
|
|
|
|
function TXmlNode.UnescapeString(const AValue: UTF8String): UTF8String;
|
|
begin
|
|
Result := sdUTF8UnEscapeString(AValue)
|
|
end;
|
|
|
|
function TXmlNode.UseFullNodes: boolean;
|
|
begin
|
|
Result := False;
|
|
if assigned(Document) then
|
|
Result := Document.UseFullNodes;
|
|
end;
|
|
|
|
function TXmlNode.UseLocalBias: Boolean;
|
|
begin
|
|
Result := False;
|
|
if Assigned(Document) then
|
|
Result := Document.UseLocalBias;
|
|
end;
|
|
|
|
function TXmlNode.ValueAsBoolDef(ADefault: boolean): boolean;
|
|
var
|
|
Ch: AnsiChar;
|
|
begin
|
|
Result := ADefault;
|
|
if Length(FValue) = 0 then
|
|
exit;
|
|
Ch := sdUpCase(FValue[1]);
|
|
if Ch in ['T', 'Y'] then
|
|
begin
|
|
Result := True;
|
|
exit;
|
|
end;
|
|
if Ch in ['F', 'N'] then
|
|
begin
|
|
Result := False;
|
|
exit;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.ValueAsDateTimeDef(ADefault: TDateTime): TDateTime;
|
|
begin
|
|
Result := sdDateTimeFromStringDefault(ValueAsString, ADefault, UseLocalBias);
|
|
end;
|
|
|
|
function TXmlNode.ValueAsFloatDef(ADefault: double): double;
|
|
var
|
|
Code: integer;
|
|
begin
|
|
try
|
|
val(string(sdUTF8StringReplace(FValue, ',', '.')), Result, Code);
|
|
if Code > 0 then
|
|
Result := ADefault;
|
|
except
|
|
Result := ADefault;
|
|
end;
|
|
end;
|
|
|
|
function TXmlNode.ValueAsInt64Def(ADefault: int64): int64;
|
|
begin
|
|
Result := StrToInt64Def(string(FValue), ADefault);
|
|
end;
|
|
|
|
function TXmlNode.ValueAsIntegerDef(ADefault: integer): integer;
|
|
begin
|
|
Result := StrToIntDef(string(FValue), ADefault);
|
|
end;
|
|
|
|
procedure TXmlNode.WriteAttributeBool(const AName: UTF8String; AValue: boolean; ADefault: boolean);
|
|
var
|
|
Index: integer;
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
begin
|
|
Index := AttributeIndexByName(AName);
|
|
if Index >= 0 then
|
|
AttributeValue[Index] := sdStringFromBool(AValue)
|
|
else
|
|
AttributeAdd(AName, sdStringFromBool(AValue));
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteAttributeDateTime(const AName: UTF8String; AValue, ADefault: TDateTime);
|
|
var
|
|
Index: integer;
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
begin
|
|
Index := AttributeIndexByName(AName);
|
|
if Index >= 0 then
|
|
AttributeValue[Index] := sdDateTimeToString(AValue, UseLocalBias)
|
|
else
|
|
AttributeAdd(AName, sdDateTimeToString(AValue, UseLocalBias));
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteAttributeFloat(const AName: UTF8String; AValue, ADefault: double);
|
|
var
|
|
Index: integer;
|
|
S: UTF8String;
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
begin
|
|
Index := AttributeIndexByName(AName);
|
|
S := sdWriteNumber(AValue, FloatSignificantDigits, FloatAllowScientific);
|
|
if Index >= 0 then
|
|
AttributeValue[Index] := S
|
|
else
|
|
AttributeAdd(AName, S);
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteAttributeInteger(const AName: UTF8String; AValue: integer; ADefault: integer);
|
|
var
|
|
Index: integer;
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
begin
|
|
Index := AttributeIndexByName(AName);
|
|
if Index >= 0 then
|
|
AttributeValue[Index] := IntToUTF8Str(AValue)
|
|
else
|
|
AttributeAdd(AName, IntToUTF8Str(AValue));
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteAttributeInt64(const AName: UTF8String; const AValue: int64; ADefault: int64);
|
|
var
|
|
Index: integer;
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
begin
|
|
Index := AttributeIndexByName(AName);
|
|
if Index >= 0 then
|
|
AttributeValue[Index] := IntToUTF8Str(AValue)
|
|
else
|
|
AttributeAdd(AName, IntToUTF8Str(AValue));
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteAttributeString(const AName, AValue, ADefault: UTF8String);
|
|
var
|
|
Index: integer;
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
begin
|
|
Index := AttributeIndexByName(AName);
|
|
if Index >= 0 then
|
|
AttributeValue[Index] := AValue
|
|
else
|
|
AttributeAdd(AName, AValue);
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteBool(const AName: UTF8String; AValue: boolean; ADefault: boolean);
|
|
const
|
|
cBoolValues: array[boolean] of UTF8String = ('False', 'True');
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
with NodeFindOrCreate(AName) do
|
|
ValueAsString := cBoolValues[AValue];
|
|
end;
|
|
|
|
{$IFDEF USEGRAPHICS}
|
|
procedure TXmlNode.WriteBrush(const AName: UTF8String; ABrush: TBrush);
|
|
begin
|
|
with NodeFindOrCreate(AName) do
|
|
begin
|
|
WriteColor('Color', ABrush.Color, clBlack);
|
|
WriteInteger('Style', integer(ABrush.Style), 0);
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteColor(const AName: UTF8String; AValue, ADefault: TColor);
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
WriteHex(AName, ColorToRGB(AValue), 8, 0);
|
|
end;
|
|
{$ENDIF}
|
|
|
|
procedure TXmlNode.WriteDateTime(const AName: UTF8String; AValue, ADefault: TDateTime);
|
|
// Date MUST always be written in this format:
|
|
// YYYY-MM-DD (if just date) or
|
|
// YYYY-MM-DDThh:mm:ss.sssZ (if date and time. The Z stands for universal time
|
|
// zone. Since Delphi's TDateTime does not give us a clue about the timezone,
|
|
// this is the easiest solution)
|
|
// This format SHOULD NOT be changed, to avoid all kinds of
|
|
// conversion errors in future.
|
|
// This format is compatible with the W3C date/time specification as found here:
|
|
// http://www.w3.org/TR/NOTE-datetime
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
WriteString(AName, sdDateTimeToString(AValue, UseLocalBias), '');
|
|
end;
|
|
|
|
procedure TXmlNode.WriteFloat(const AName: UTF8String; AValue: double; ADefault: double);
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
with NodeFindOrCreate(AName) do
|
|
ValueAsString := sdWriteNumber(AValue, FloatSignificantDigits, FloatAllowScientific);
|
|
end;
|
|
|
|
{$IFDEF USEGRAPHICS}
|
|
procedure TXmlNode.WriteFont(const AName: UTF8String; AFont: TFont);
|
|
begin
|
|
with NodeFindOrCreate(AName) do
|
|
begin
|
|
WriteString('Name', UTF8String(AFont.Name), 'Arial');
|
|
WriteColor('Color', AFont.Color, clBlack);
|
|
WriteInteger('Size', AFont.Size, 14);
|
|
WriteBool('Bold', fsBold in AFont.Style, False);
|
|
WriteBool('Italic', fsItalic in AFont.Style, False);
|
|
WriteBool('Underline', fsUnderline in AFont.Style, False);
|
|
WriteBool('Strikeout', fsStrikeout in AFont.Style, False);
|
|
end;
|
|
end;
|
|
{$ENDIF}
|
|
|
|
procedure TXmlNode.WriteHex(const AName: UTF8String; AValue, Digits: integer; ADefault: integer);
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
with NodeFindOrCreate(AName) do
|
|
ValueAsString := '$' + UTF8String(IntToHex(AValue, Digits));
|
|
end;
|
|
|
|
function TXmlNode.WriteInnerTag: UTF8String;
|
|
// Write the inner part of the tag, the one that contains the attributes
|
|
var
|
|
i: integer;
|
|
begin
|
|
Result := '';
|
|
// Attributes
|
|
for i := 0 to AttributeCount - 1 do
|
|
// Here we used to prevent empty attributes, but in fact, empty attributes
|
|
// should be allowed because sometimes they're required
|
|
Result := Result + ' ' + AttributePair[i];
|
|
// End of tag - direct nodes get an extra "/"
|
|
if QualifyAsDirectNode then
|
|
Result := Result + '/';
|
|
end;
|
|
|
|
procedure TXmlNode.WriteInt64(const AName: UTF8String; AValue, ADefault: int64);
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
with NodeFindOrCreate(AName) do
|
|
ValueAsString := IntToUTF8Str(AValue);
|
|
end;
|
|
|
|
procedure TXmlNode.WriteInteger(const AName: UTF8String; AValue: integer; ADefault: integer);
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
with NodeFindOrCreate(AName) do
|
|
ValueAsString := IntToUTF8Str(AValue);
|
|
end;
|
|
|
|
{$IFDEF USEGRAPHICS}
|
|
procedure TXmlNode.WritePen(const AName: UTF8String; APen: TPen);
|
|
begin
|
|
with NodeFindOrCreate(AName) do
|
|
begin
|
|
WriteColor('Color', APen.Color, clBlack);
|
|
WriteInteger('Mode', integer(APen.Mode), 0);
|
|
WriteInteger('Style', integer(APen.Style), 0);
|
|
WriteInteger('Width', APen.Width, 0);
|
|
end;
|
|
end;
|
|
{$ENDIF}
|
|
|
|
procedure TXmlNode.WriteString(const AName, AValue: UTF8String; const ADefault: UTF8String);
|
|
begin
|
|
if WriteOnDefault or (AValue <> ADefault) then
|
|
with NodeFindOrCreate(AName) do
|
|
ValueAsString := AValue;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteToStream(S: TStream);
|
|
var
|
|
i: integer;
|
|
Indent: UTF8String;
|
|
LFeed: UTF8String;
|
|
Line: UTF8String;
|
|
ThisNode, NextNode: TXmlNode;
|
|
AddLineFeed: boolean;
|
|
begin
|
|
Indent := GetIndent;
|
|
LFeed := GetLineFeed;
|
|
|
|
// Write indent
|
|
Line := Indent;
|
|
|
|
// Write the node - distinguish node type
|
|
case ElementType of
|
|
xeDeclaration: // XML declaration <?xml{declaration}?>
|
|
begin
|
|
// Explicitly delete empty attributes in the declaration,
|
|
// this is usually the encoding and we do not want encoding=""
|
|
// to show up
|
|
DeleteEmptyAttributes;
|
|
Line := Indent + '<?xml' + WriteInnerTag + '?>';
|
|
end;
|
|
xeStylesheet: // Stylesheet <?xml-stylesheet{stylesheet}?>
|
|
Line := Indent + '<?xml-stylesheet' + WriteInnerTag + '?>';
|
|
xeDoctype:
|
|
begin
|
|
if NodeCount = 0 then
|
|
Line := Indent + '<!DOCTYPE ' + Name + ' ' + ValueDirect + '>'
|
|
else
|
|
begin
|
|
Line := Indent + '<!DOCTYPE ' + Name + ' ' + ValueDirect + ' [' + LFeed;
|
|
sdUTF8WriteStringToStream(S, Line);
|
|
for i := 0 to NodeCount - 1 do
|
|
begin
|
|
Nodes[i].WriteToStream(S);
|
|
sdUTF8WriteStringToStream(S, LFeed);
|
|
end;
|
|
Line := ']>';
|
|
end;
|
|
end;
|
|
xeElement:
|
|
Line := Indent + '<!ELEMENT ' + Name + ' ' + ValueDirect + '>';
|
|
xeAttList:
|
|
Line := Indent + '<!ATTLIST ' + Name + ' ' + ValueDirect + '>';
|
|
xeEntity:
|
|
Line := Indent + '<!ENTITY ' + Name + ' ' + ValueDirect + '>';
|
|
xeNotation:
|
|
Line := Indent + '<!NOTATION ' + Name + ' ' + ValueDirect + '>';
|
|
xeComment: // Comment <!--{comment}-->
|
|
Line := Indent + '<!--' + ValueDirect + '-->';
|
|
xeCData: // literal data <![CDATA[{data}]]>
|
|
Line := Indent + '<![CDATA[' + ValueDirect + ']]>';
|
|
xeExclam: // Any <!data>
|
|
Line := Indent + '<!' + ValueDirect + '>';
|
|
xeQuestion: // Any <?data?>
|
|
Line := Indent + '<?' + ValueDirect + '?>';
|
|
xeCharData:
|
|
Line := FValue;
|
|
xeUnknown: // Any <data>
|
|
Line := Indent + '<' + ValueDirect + '>';
|
|
xeNormal: // normal nodes (xeNormal)
|
|
begin
|
|
// Write tag
|
|
Line := Line + '<' + FName + WriteInnerTag + '>';
|
|
|
|
// Write value (if any)
|
|
Line := Line + FValue;
|
|
if (NodeCount > 0) then
|
|
// ..and a linefeed
|
|
Line := Line + LFeed;
|
|
|
|
sdUTF8WriteStringToStream(S, Line);
|
|
|
|
// Write child elements
|
|
for i := 0 to NodeCount - 1 do
|
|
begin
|
|
ThisNode := Nodes[i];
|
|
NextNode := Nodes[i + 1];
|
|
ThisNode.WriteToStream(S);
|
|
AddLineFeed := True;
|
|
if ThisNode.ElementType = xeCharData then
|
|
AddLineFeed := False;
|
|
if assigned(NextNode) then
|
|
if NextNode.ElementType = xeCharData then
|
|
AddLineFeed := False;
|
|
if AddLineFeed then
|
|
sdUTF8WriteStringToStream(S, LFeed);
|
|
end;
|
|
|
|
// Write end tag
|
|
Line := '';
|
|
if not QualifyAsDirectNode then
|
|
begin
|
|
if NodeCount > 0 then
|
|
Line := Indent;
|
|
Line := Line + '</' + FName + '>';
|
|
end;
|
|
end;
|
|
else
|
|
raise EFilerError.Create(sxeIllegalElementType);
|
|
end;//case
|
|
sdUTF8WriteStringToStream(S, Line);
|
|
|
|
// Call the onprogress
|
|
if assigned(Document) then
|
|
Document.DoProgress(S.Position);
|
|
end;
|
|
|
|
function TXmlNode.WriteToString: UTF8String;
|
|
var
|
|
S: TsdUTF8StringStream;
|
|
begin
|
|
// We will simply call WriteToStream and collect the result as UTF8String using
|
|
// a string stream
|
|
S := TsdUTF8StringStream.Create('');
|
|
try
|
|
WriteToStream(S);
|
|
Result := S.DataString;
|
|
finally
|
|
S.Free;
|
|
end;
|
|
end;
|
|
|
|
procedure TXmlNode.WriteUnicodeString(const AName: UTF8String;
|
|
const AValue: UnicodeString; const ADefault: UnicodeString);
|
|
begin
|
|
WriteString(AName, FromUnicodeString(AValue), FromUnicodeString(ADefault));
|
|
end;
|
|
|
|
{ TXmlNodeList }
|
|
|
|
function TXmlNodeList.ByAttribute(const AName, AValue: UTF8String): TXmlNode;
|
|
var
|
|
i: integer;
|
|
begin
|
|
for i := 0 to Count - 1 do
|
|
if UTF8CompareText(Items[i].AttributeByName[AName], AValue) = 0 then
|
|
begin
|
|
Result := Items[i];
|
|
exit;
|
|
end;
|
|
Result := nil;
|
|
end;
|
|
|
|
function TXmlNodeList.GetItems(Index: Integer): TXmlNode;
|
|
begin
|
|
Result := TXmlNode(Get(Index));
|
|
end;
|
|
|
|
procedure TXmlNodeList.SetItems(Index: Integer; const Value: TXmlNode);
|
|
begin
|
|
Put(Index, TPointer(Value));
|
|
end;
|
|
|
|
{ TNativeXml }
|
|
|
|
procedure TNativeXml.Assign(Source: TPersistent);
|
|
// local
|
|
procedure SetDocumentRecursively(ANode: TXmlNode; ADocument: TNativeXml);
|
|
var
|
|
i: integer;
|
|
begin
|
|
ANode.Document := ADocument;
|
|
for i := 0 to ANode.NodeCount - 1 do
|
|
SetDocumentRecursively(ANode.Nodes[i], ADocument);
|
|
end;
|
|
// main
|
|
begin
|
|
if Source is TNativeXml then
|
|
begin
|
|
// Copy private members
|
|
FBinaryEncoding := TNativeXml(Source).FBinaryEncoding;
|
|
FDropCommentsOnParse := TNativeXml(Source).FDropCommentsOnParse;
|
|
FExternalEncoding := TNativeXml(Source).FExternalEncoding;
|
|
FParserWarnings := TNativeXml(Source).FParserWarnings;
|
|
FIndentString := TNativeXml(Source).FIndentString;
|
|
FUseFullNodes := TNativeXml(Source).FUseFullNodes;
|
|
FUseLocalBias := TNativeXml(Source).FUseLocalBias;
|
|
FWriteOnDefault := TNativeXml(Source).FWriteOnDefault;
|
|
FXmlFormat := TNativeXml(Source).FXmlFormat;
|
|
// Assign root
|
|
FRootNodes.Assign(TNativeXml(Source).FRootNodes);
|
|
// Set Document property recursively
|
|
SetDocumentRecursively(FRootNodes, Self);
|
|
end else
|
|
if Source is TXmlNode then
|
|
begin
|
|
// Assign this node to the FRootNodes property
|
|
FRootNodes.Assign(Source);
|
|
// Set Document property recursively
|
|
SetDocumentRecursively(FRootNodes, Self);
|
|
end else
|
|
inherited;
|
|
end;
|
|
|
|
procedure TNativeXml.Clear;
|
|
var
|
|
Node: TXmlNode;
|
|
begin
|
|
// Reset defaults
|
|
SetDefaults;
|
|
// Clear root
|
|
FRootNodes.Clear;
|
|
// Build default items in RootNodes
|
|
// - first the declaration
|
|
Node := TXmlNode.CreateType(Self, xeDeclaration);
|
|
Node.Name := 'xml';
|
|
Node.AttributeAdd('version', cDefaultVersionString);
|
|
Node.AttributeAdd('encoding', cDefaultEncodingString);
|
|
FRootNodes.NodeAdd(Node);
|
|
// - then the root node
|
|
FRootNodes.NodeNew('');
|
|
end;
|
|
|
|
procedure TNativeXml.CopyFrom(Source: TNativeXml);
|
|
begin
|
|
if not assigned(Source) then
|
|
exit;
|
|
Assign(Source);
|
|
end;
|
|
|
|
constructor TNativeXml.Create;
|
|
begin
|
|
inherited Create;
|
|
FRootNodes := TXmlNode.Create(Self);
|
|
Clear;
|
|
end;
|
|
|
|
constructor TNativeXml.CreateName(const ARootName: UTF8String);
|
|
begin
|
|
Create;
|
|
Root.Name := ARootName;
|
|
end;
|
|
|
|
destructor TNativeXml.Destroy;
|
|
begin
|
|
FreeAndNil(FRootNodes);
|
|
inherited;
|
|
end;
|
|
|
|
procedure TNativeXml.DoNodeLoaded(Node: TXmlNode);
|
|
begin
|
|
if assigned(FOnNodeLoaded) then
|
|
FOnNodeLoaded(Self, Node);
|
|
end;
|
|
|
|
procedure TNativeXml.DoNodeNew(Node: TXmlNode);
|
|
begin
|
|
if assigned(FOnNodeNew) then
|
|
FOnNodeNew(Self, Node);
|
|
end;
|
|
|
|
procedure TNativeXml.DoProgress(Size: integer);
|
|
begin
|
|
if assigned(FOnProgress) then
|
|
FOnProgress(Self, Size);
|
|
end;
|
|
|
|
procedure TNativeXml.DoUnicodeLoss(Sender: TObject);
|
|
begin
|
|
if assigned(FOnUnicodeLoss) then
|
|
FOnUnicodeLoss(Self);
|
|
end;
|
|
|
|
function TNativeXml.GetCommentString: UTF8String;
|
|
// Get the first comment node, and return its value
|
|
var
|
|
Node: TXmlNode;
|
|
begin
|
|
Result := '';
|
|
Node := FRootNodes.NodeByElementType(xeComment);
|
|
if assigned(Node) then
|
|
Result := Node.ValueAsString;
|
|
end;
|
|
|
|
function TNativeXml.GetEncodingString: UTF8String;
|
|
begin
|
|
Result := '';
|
|
if FRootNodes.NodeCount > 0 then
|
|
if FRootNodes[0].ElementType = xeDeclaration then
|
|
Result := FRootNodes[0].AttributeByName['encoding'];
|
|
end;
|
|
|
|
function TNativeXml.GetEntityByName(AName: UTF8String): UTF8String;
|
|
var
|
|
i, j: integer;
|
|
begin
|
|
Result := '';
|
|
for i := 0 to FRootNodes.NodeCount - 1 do
|
|
if FRootNodes[i].ElementType = xeDoctype then with FRootNodes[i] do
|
|
begin
|
|
for j := 0 to NodeCount - 1 do
|
|
if (Nodes[j].ElementType = xeEntity) and (Nodes[j].Name = AName) then
|
|
begin
|
|
Result := sdUTF8UnQuotedString(sdUTF8Trim(Nodes[j].ValueDirect));
|
|
exit;
|
|
end;
|
|
end;
|
|
end;
|
|
|
|
function TNativeXml.GetRoot: TXmlNode;
|
|
begin
|
|
Result := FRootNodes.NodeByElementType(xeNormal);
|
|
end;
|
|
|
|
function TNativeXml.GetStyleSheetNode: TXmlNode;
|
|
begin
|
|
Result := FRootNodes.NodeByElementType(xeStylesheet);
|
|
if not assigned(Result) then
|
|
begin
|
|
// Add a stylesheet node as second one if none present
|
|
Result := TXmlNode.CreateType(Self, xeStyleSheet);
|
|
FRootNodes.NodeInsert(1, Result);
|
|
end;
|
|
end;
|
|
|
|
function TNativeXml.GetUtf8Encoded: boolean;
|
|
begin
|
|
Result := True;
|
|
end;
|
|
|
|
function TNativeXml.GetVersionString: UTF8String;
|
|
begin
|
|
Result := '';
|
|
if FRootNodes.NodeCount > 0 then
|
|
if FRootNodes[0].ElementType = xeDeclaration then
|
|
Result := FRootNodes[0].AttributeByName['version'];
|
|
end;
|
|
|
|
function TNativeXml.IsEmpty: boolean;
|
|
var
|
|
R: TXmlNode;
|
|
begin
|
|
Result := True;
|
|
R := GetRoot;
|
|
if assigned(R) then
|
|
Result := R.IsClear;
|
|
end;
|
|
|
|
function TNativeXml.LineFeed: UTF8String;
|
|
begin
|
|
case XmlFormat of
|
|
xfReadable:
|
|
Result := #13#10;
|
|
xfCompact:
|
|
Result := #10;
|
|
else
|
|
Result := #10;
|
|
end;//case
|
|
end;
|
|
|
|
procedure TNativeXml.LoadFromFile(const AFileName: string);
|
|
var
|
|
S: TStream;
|
|
begin
|
|
S := TFileStream.Create(AFileName, fmOpenRead or fmShareDenyWrite);
|
|
try
|
|
LoadFromStream(S);
|
|
finally
|
|
S.Free;
|
|
end;
|
|
end;
|
|
|
|
procedure TNativeXml.LoadFromStream(Stream: TStream);
|
|
var
|
|
B: TsdBufferedReadStream;
|
|
begin
|
|
// Create buffer filter. Since we read from the original stream a buffer at a
|
|
// time, this speeds up the reading process for disk-based files.
|
|
B := TsdBufferedReadStream.Create(Stream, False);
|
|
try
|
|
// We will create a conversion stream as intermediate
|
|
FCodecStream := TsdUtf8Stream.Create(B);
|
|
try
|
|
// Connect events
|
|
FCodecStream.OnUnicodeLoss := DoUnicodeLoss;
|
|
// Read from stream
|
|
ReadFromStream(FCodecStream);
|
|
// Set our external encoding
|
|
FExternalEncoding := FCodecStream.Encoding;
|
|
finally
|
|
FreeAndNil(FCodecStream);
|
|
end;
|
|
finally
|
|
B.Free;
|
|
end;
|
|
end;
|
|
|
|
procedure TNativeXml.ParseDTD(ANode: TXmlNode; S: TStream);
|
|
// DTD parsing is quite different from normal node parsing so it is brought
|
|
// under in the main NativeXml object
|
|
// local
|
|
procedure ParseMarkupDeclarations;
|
|
var
|
|
Ch: AnsiChar;
|
|
begin
|
|
repeat
|
|
ANode.NodeNew('').ReadFromStream(S);
|
|
// Read AnsiCharacter, exit if none available
|
|
repeat
|
|
if S.Read(Ch, 1) = 0 then
|
|
exit;
|
|
// Read until end markup declaration or end
|
|
until not (Ch in cControlChars);
|
|
if Ch = ']' then
|
|
break;
|
|
S.Seek(-1, soCurrent);
|
|
until False;
|
|
end;
|
|
// main
|
|
var
|
|
Prework: UTF8String;
|
|
Ch: AnsiChar;
|
|
Words: TsdUTF8StringList;
|
|
begin
|
|
// Get the name and external ID
|
|
Prework := '';
|
|
repeat
|
|
// Read AnsiCharacter, exit if none available
|
|
if S.Read(Ch, 1) = 0 then
|
|
exit;
|
|
// Read until markup declaration or end
|
|
if Ch in ['[', '>'] then
|
|
break;
|
|
Prework := Prework + UTF8String(Ch);
|
|
until False;
|
|
Words := TsdUTF8StringList.Create;
|
|
try
|
|
sdUTF8ParseAttributes(Prework, 1, length(Prework) + 1, Words);
|
|
// First word is name
|
|
if Words.Count > 0 then
|
|
begin
|
|
ANode.Name := Words[0];
|
|
Words.Delete(0);
|
|
// Put the rest in the valuedirect
|
|
ANode.ValueDirect := sdUTF8Trim(sdUTF8StringReplace(Words.Text, #13#10, ' '));
|
|
end;
|
|
finally
|
|
Words.Free;
|
|
end;
|
|
|
|
if Ch = '[' then
|
|
begin
|
|
|
|
// Parse any !ENTITY nodes and such
|
|
ParseMarkupDeclarations;
|
|
|
|
// read final tag
|
|
repeat
|
|
if S.Read(Ch, 1) = 0 then
|
|
exit;
|
|
if Ch = '>' then
|
|
break;
|
|
until False;
|
|
|
|
end;
|
|
end;
|
|
|
|
procedure TNativeXml.ReadFromStream(S: TStream);
|
|
var
|
|
i: integer;
|
|
Node: TXmlNode;
|
|
Enc: UTF8String;
|
|
NormalCount, DeclarationCount,
|
|
DoctypeCount, CDataCount: integer;
|
|
NormalPos, DoctypePos: integer;
|
|
begin
|
|
FAbortParsing := False;
|
|
with FRootNodes do
|
|
begin
|
|
// Clear the old root nodes - we do not reset the defaults
|
|
Clear;
|
|
DoProgress(0);
|
|
repeat
|
|
Node := NodeNew('');
|
|
Node.ReadFromStream(S);
|
|
if AbortParsing then
|
|
exit;
|
|
|
|
// XML declaration
|
|
if Node.ElementType = xeDeclaration then
|
|
begin
|
|
if Node.HasAttribute('encoding') then
|
|
Enc := Node.AttributeByName['encoding']
|
|
else
|
|
FCodecStream.Encoding := seUTF8;
|
|
// Check encoding
|
|
if assigned(FCodecStream) and (AnsiUpperCase(string(Enc)) = 'UTF-8') then
|
|
FCodecStream.Encoding := seUTF8;
|
|
end;
|
|
// Skip clear nodes
|
|
if Node.IsClear then
|
|
NodeDelete(NodeCount - 1);
|
|
until S.Position >= S.Size;
|
|
DoProgress(S.Size);
|
|
|
|
// Do some checks
|
|
NormalCount := 0;
|
|
DeclarationCount := 0;
|
|
DoctypeCount := 0;
|
|
CDataCount := 0;
|
|
NormalPos := -1;
|
|
DoctypePos := -1;
|
|
for i := 0 to NodeCount - 1 do
|
|
begin
|
|
// Count normal elements - there may be only one
|
|
case Nodes[i].ElementType of
|
|
xeNormal:
|
|
begin
|
|
inc(NormalCount);
|
|
NormalPos := i;
|
|
end;
|
|
xeDeclaration: inc(DeclarationCount);
|
|
xeDoctype:
|
|
begin
|
|
inc(DoctypeCount);
|
|
DoctypePos := i;
|
|
end;
|
|
xeCData: inc(CDataCount);
|
|
end;//case
|
|
end;
|
|
|
|
// We *must* have a root node
|
|
if NormalCount = 0 then
|
|
raise EFilerError.Create(sxeNoRootElement);
|
|
|
|
// Do some validation if we allow parser warnings
|
|
if FParserWarnings then
|
|
begin
|
|
|
|
// Check for more than one root node
|
|
if NormalCount > 1 then
|
|
raise EFilerError.Create(sxeMoreThanOneRootElement);
|
|
|
|
// Check for more than one xml declaration
|
|
if DeclarationCount > 1 then
|
|
raise EFilerError.Create(sxeMoreThanOneDeclaration);
|
|
|
|
// Declaration must be first element if present
|
|
if DeclarationCount = 1 then
|
|
if Nodes[0].ElementType <> xeDeclaration then
|
|
raise EFilerError.Create(sxeDeclarationMustBeFirstElem);
|
|
|
|
// Check for more than one DTD
|
|
if DoctypeCount > 1 then
|
|
raise EFilerError.Create(sxeMoreThanOneDoctype);
|
|
|
|
// Check if DTD is after root, this is not allowed
|
|
if (DoctypeCount = 1) and (DoctypePos > NormalPos) then
|
|
raise EFilerError.Create(sxeDoctypeAfterRootElement);
|
|
|
|
// No CDATA in root allowed
|
|
if CDataCount > 0 then
|
|
raise EFilerError.Create(sxeCDataInRoot);
|
|
end;
|
|
end;//with
|
|
end;
|
|
|
|
procedure TNativeXml.ReadFromString(const AValue: UTF8String);
|
|
var
|
|
S: TStream;
|
|
begin
|
|
S := TsdUTF8StringStream.Create(AValue);
|
|
try
|
|
ReadFromStream(S);
|
|
finally
|
|
S.Free;
|
|
end;
|
|
end;
|
|
|
|
procedure TNativeXml.ResolveEntityReferences;
|
|
begin
|
|
if assigned(Root) then
|
|
Root.ResolveEntityReferences;
|
|
end;
|
|
|
|
procedure TNativeXml.SaveToFile(const AFileName: string);
|
|
var
|
|
S: TStream;
|
|
begin
|
|
S := TFileStream.Create(AFileName, fmCreate);
|
|
try
|
|
SaveToStream(S);
|
|
finally
|
|
S.Free;
|
|
end;
|
|
end;
|
|
|
|
procedure TNativeXml.SaveToStream(Stream: TStream);
|
|
var
|
|
B: TsdBufferedWriteStream;
|
|
begin
|
|
// Create buffer filter. Since we write a buffer at a time to the destination
|
|
// stream, this speeds up the writing process for disk-based files.
|
|
B := TsdBufferedWriteStream.Create(Stream, False);
|
|
try
|
|
// Create conversion stream
|
|
FCodecStream := TsdUtf8Stream.Create(B);
|
|
try
|
|
// Set External encoding
|
|
FCodecStream.Encoding := FExternalEncoding;
|
|
WriteToStream(FCodecStream);
|
|
finally
|
|
FreeAndNil(FCodecStream);
|
|
end;
|
|
finally
|
|
B.Free;
|
|
end;
|
|
end;
|
|
|
|
procedure TNativeXml.SetCommentString(const Value: UTF8String);
|
|
// Find first comment node and set it's value, otherwise add new comment node
|
|
// right below the xml declaration
|
|
var
|
|
Node: TXmlNode;
|
|
begin
|
|
Node := FRootNodes.NodeByElementType(xeComment);
|
|
if not assigned(Node) and (length(Value) > 0) then
|
|
begin
|
|
Node := TXmlNode.CreateType(Self, xeComment);
|
|
FRootNodes.NodeInsert(1, Node);
|
|
end;
|
|
if assigned(Node) then
|
|
Node.ValueAsString := Value;
|
|
end;
|
|
|
|
procedure TNativeXml.SetDefaults;
|
|
begin
|
|
// Defaults
|
|
FExternalEncoding := cDefaultExternalEncoding;
|
|
FXmlFormat := cDefaultXmlFormat;
|
|
FWriteOnDefault := cDefaultWriteOnDefault;
|
|
FBinaryEncoding := cDefaultBinaryEncoding;
|
|
FIndentString := cDefaultIndentString;
|
|
FDropCommentsOnParse := cDefaultDropCommentsOnParse;
|
|
FUseFullNodes := cDefaultUseFullNodes;
|
|
FUseLocalBias := cDefaultUseLocalBias;
|
|
FFloatAllowScientific := cDefaultFloatAllowScientific;
|
|
FFloatSignificantDigits := cDefaultFloatSignificantDigits;
|
|
FOnNodeNew := nil;
|
|
FOnNodeLoaded := nil;
|
|
end;
|
|
|
|
procedure TNativeXml.SetEncodingString(const Value: UTF8String);
|
|
var
|
|
Node: TXmlNode;
|
|
begin
|
|
if Value = GetEncodingString then
|
|
exit;
|
|
Node := FRootNodes[0];
|
|
if not assigned(Node) or (Node.ElementType <> xeDeclaration) then
|
|
begin
|
|
Node := TXmlNode.CreateType(Self, xeDeclaration);
|
|
FRootNodes.NodeInsert(0, Node);
|
|
end;
|
|
if assigned(Node) then
|
|
Node.AttributeByName['encoding'] := Value;
|
|
end;
|
|
|
|
procedure TNativeXml.SetVersionString(const Value: UTF8String);
|
|
var
|
|
Node: TXmlNode;
|
|
begin
|
|
if Value = GetVersionString then
|
|
exit;
|
|
Node := FRootNodes[0];
|
|
if not assigned(Node) or (Node.ElementType <> xeDeclaration) then
|
|
begin
|
|
if length(Value) > 0 then
|
|
begin
|
|
Node := TXmlNode.CreateType(Self, xeDeclaration);
|
|
FRootNodes.NodeInsert(0, Node);
|
|
end;
|
|
end;
|
|
if assigned(Node) then
|
|
Node.AttributeByName['version'] := Value;
|
|
end;
|
|
|
|
procedure TNativeXml.WriteToStream(S: TStream);
|
|
var
|
|
i: integer;
|
|
begin
|
|
if not assigned(Root) and FParserWarnings then
|
|
raise EFilerError.Create(sxeRootElementNotDefined);
|
|
|
|
DoProgress(0);
|
|
|
|
// write the root nodes
|
|
for i := 0 to FRootNodes.NodeCount - 1 do
|
|
begin
|
|
FRootNodes[i].WriteToStream(S);
|
|
sdUTF8WriteStringToStream(S, LineFeed);
|
|
end;
|
|
|
|
DoProgress(S.Size);
|
|
end;
|
|
|
|
function TNativeXml.WriteToString: UTF8String;
|
|
var
|
|
S: TsdUTF8StringStream;
|
|
begin
|
|
S := TsdUTF8StringStream.Create('');
|
|
try
|
|
WriteToStream(S);
|
|
Result := S.DataString;
|
|
finally
|
|
S.Free;
|
|
end;
|
|
end;
|
|
|
|
{ TsdCodecStream }
|
|
|
|
constructor TsdCodecStream.Create(AStream: TStream);
|
|
begin
|
|
inherited Create;
|
|
FStream := AStream;
|
|
end;
|
|
|
|
function TsdCodecStream.InternalRead(var Buffer{$IFDEF CLR}: array of Byte{$ENDIF}; Offset, Count: Longint): Longint;
|
|
// Read from FStream and pass back data
|
|
var
|
|
i, j: integer;
|
|
BOM: array[0..3] of byte;
|
|
BytesRead: integer;
|
|
Found: boolean;
|
|
begin
|
|
Result := 0;
|
|
if FMode = umUnknown then
|
|
begin
|
|
FMode := umRead;
|
|
// Check FStream
|
|
if not assigned(FStream) then
|
|
raise EStreamError.Create(sxeCodecStreamNotAssigned);
|
|
|
|
// Determine encoding
|
|
FEncoding := seAnsi;
|
|
BytesRead := FStream.Read(BOM, 4);
|
|
for i := 0 to cBomInfoCount - 1 do
|
|
begin
|
|
Found := True;
|
|
for j := 0 to Min(BytesRead, cBomInfo[i].Len) - 1 do
|
|
begin
|
|
if BOM[j] <> cBomInfo[i].BOM[j] then
|
|
begin
|
|
Found := False;
|
|
break;
|
|
end;
|
|
end;
|
|
if Found then
|
|
break;
|
|
end;
|
|
if Found then
|
|
begin
|
|
FEncoding := cBomInfo[i].Encoding;
|
|
FWriteBom := cBomInfo[i].HasBOM;
|
|
end else
|
|
begin
|
|
// Unknown.. default to this
|
|
FEncoding := seAnsi;
|
|
FWriteBom := False;
|
|
end;
|
|
|
|
// Some encodings are not supported (yet)
|
|
if FEncoding in [seUCS4BE, seUCS4_2143, seUCS4_3412, seEBCDIC] then
|
|
raise EStreamError.Create(sxeUnsupportedEncoding);
|
|
|
|
// Correct stream to start position
|
|
if FWriteBom then
|
|
FStream.Seek(cBomInfo[i].Len - BytesRead, soCurrent)
|
|
else
|
|
FStream.Seek(-BytesRead, soCurrent);
|
|
|
|
// Check if we must swap byte order
|
|
if FEncoding in [se16BitBE, seUTF16BE] then
|
|
FSwapByteOrder := True;
|
|
|
|
end;
|
|
|
|
// Check mode
|
|
if FMode <> umRead then
|
|
raise EStreamError.Create(sxeCannotReadCodecForWriting);
|
|
|
|
// Check count
|
|
if Count <> 1 then
|
|
raise EStreamError.Create(sxeCannotReadMultipeChar);
|
|
|
|
// Now finally read
|
|
TBytes(Buffer)[Offset] := ReadByte;
|
|
if TBytes(Buffer)[Offset] <> 0 then Result := 1;
|
|
end;
|
|
|
|
{$IFDEF CLR}
|
|
|
|
function TsdCodecStream.Read(var Buffer: array of Byte; Offset, Count: Longint): Longint;
|
|
begin
|
|
Result := InternalRead(Buffer, Offset, Count);
|
|
end;
|
|
|
|
{$ELSE}
|
|
|
|
function TsdCodecStream.Read(var Buffer; Count: Longint): Longint;
|
|
begin
|
|
Result := InternalRead(Buffer, 0, Count);
|
|
end;
|
|
|
|
{$ENDIF}
|
|
|
|
function TsdCodecStream.ReadByte: byte;
|
|
begin
|
|
// default does nothing
|
|
Result := 0;
|
|
end;
|
|
|
|
function TsdCodecStream.InternalSeek(Offset: Longint; Origin: TSeekOrigin): Longint;
|
|
begin
|
|
Result := 0;
|
|
if FMode = umUnknown then
|
|
raise EStreamError.Create(sxeCannotSeekBeforeReadWrite);
|
|
|
|
if Origin = soCurrent then
|
|
begin
|
|
if Offset = 0 then
|
|
begin
|
|
// Position
|
|
Result := FStream.Position;
|
|
exit;
|
|
end;
|
|
if (FMode = umRead) and ((Offset = -1) or (Offset = -2)) then
|
|
begin
|
|
FBuffer := '';
|
|
case Offset of
|
|
-1: FStream.Seek(FPosMin1, soBeginning);
|
|
-2: FStream.Seek(FPosMin2, soBeginning);
|
|
end;//case
|
|
exit;
|
|
end;
|
|
end;
|
|
if (Origin = soEnd) and (Offset = 0) then
|
|
begin
|
|
// Size
|
|
Result := FStream.Size;
|
|
exit;
|
|
end;
|
|
// Ignore set position from beginning (used in Size command)
|
|
if Origin = soBeginning then
|
|
exit;
|
|
// Arriving here means we cannot do it
|
|
raise EStreamError.Create(sxeCannotPerformSeek);
|
|
end;
|
|
|
|
{$IFDEF CLR}
|
|
|
|
function TsdCodecStream.Seek(const Offset: Int64; Origin: TSeekOrigin): Int64;
|
|
begin
|
|
Result := InternalSeek(Offset, Origin);
|
|
end;
|
|
|
|
{$ELSE}
|
|
|
|
function TsdCodecStream.Seek(Offset: Longint; Origin: Word): Longint;
|
|
begin
|
|
Result := InternalSeek(Offset, TSeekOrigin(Origin));
|
|
end;
|
|
|
|
{$ENDIF}
|
|
|
|
procedure TsdCodecStream.StorePrevPositions;
|
|
begin
|
|
FPosMin2 := FPosMin1;
|
|
FPosMin1 := FStream.Position;
|
|
end;
|
|
|
|
function TsdCodecStream.InternalWrite(const Buffer{$IFDEF CLR}: array of Byte{$ENDIF}; Offset, Count: Longint): Longint;
|
|
var
|
|
i: integer;
|
|
begin
|
|
if FMode = umUnknown then
|
|
begin
|
|
FMode := umWrite;
|
|
|
|
// Some encodings are not supported (yet)
|
|
if FEncoding in [seUCS4BE, seUCS4_2143, seUCS4_3412, seEBCDIC] then
|
|
raise EStreamError.Create(sxeUnsupportedEncoding);
|
|
|
|
// Find correct encoding info
|
|
for i := 0 to cBomInfoCount - 1 do
|
|
if cBomInfo[i].Encoding = FEncoding then
|
|
begin
|
|
// we do not write BOM if UTF8 since UTF8 is default
|
|
FWriteBom := cBomInfo[i].HasBOM and (FEncoding <> seUTF8);
|
|
break;
|
|
end;
|
|
|
|
// Write BOM
|
|
if FWriteBom then
|
|
FStream.WriteBuffer(cBomInfo[i].BOM, cBomInfo[i].Len);
|
|
|
|
// Check if we must swap byte order
|
|
if FEncoding in [se16BitBE, seUTF16BE] then
|
|
FSwapByteOrder := True;
|
|
end;
|
|
|
|
if FMode <> umWrite then
|
|
raise EStreamError.Create(sxeCannotWriteCodecForReading);
|
|
WriteBuf(Buffer, Offset, Count);
|
|
Result := Count;
|
|
end;
|
|
|
|
{$IFDEF CLR}
|
|
|
|
function TsdCodecStream.Write(const Buffer: array of Byte; Offset, Count: Longint): Longint;
|
|
begin
|
|
Result := InternalWrite(Buffer, Offset, Count);
|
|
end;
|
|
|
|
{$ELSE}
|
|
|
|
function TsdCodecStream.Write(const Buffer; Count: Longint): Longint;
|
|
begin
|
|
Result := InternalWrite(Byte(Buffer), 0, Count);
|
|
end;
|
|
|
|
{$ENDIF}
|
|
|
|
procedure TsdCodecStream.WriteBuf(const Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Offset, Count: longint);
|
|
var
|
|
i: integer;
|
|
begin
|
|
// Default just writes out bytes one by one. We override this in descendants
|
|
// to provide faster writes for some modes
|
|
for i := 0 to Count - 1 do
|
|
{$IFDEF CLR}
|
|
WriteByte(Buffer[Offset + i]);
|
|
{$ELSE}
|
|
WriteByte(TBytes(Buffer)[Offset + i]);
|
|
{$ENDIF}
|
|
end;
|
|
|
|
procedure TsdCodecStream.WriteByte(const B: byte);
|
|
begin
|
|
// default does nothing
|
|
end;
|
|
|
|
{$IFDEF CLR}
|
|
|
|
procedure TsdCodecStream.SetSize(NewSize: Int64);
|
|
begin
|
|
// default does nothing
|
|
end;
|
|
|
|
{$ENDIF}
|
|
|
|
{ TsdUtf8Stream }
|
|
|
|
function TsdUtf8Stream.ReadByte: byte;
|
|
var
|
|
B, B1, B2, B3: byte;
|
|
W: word;
|
|
SA: AnsiString;
|
|
begin
|
|
Result := 0;
|
|
|
|
// New AnsiCharacter?
|
|
if (Length(FBuffer) = 0) or (FBufferPos > length(FBuffer)) then
|
|
begin
|
|
StorePrevPositions;
|
|
FBufferPos := 1;
|
|
// Read another AnsiChar and put in buffer
|
|
case FEncoding of
|
|
seAnsi:
|
|
begin
|
|
// read one byte
|
|
B := 0;
|
|
FStream.Read(B, 1);
|
|
SA := AnsiChar(B);
|
|
// Convert to UTF8
|
|
FBuffer := sdAnsiToUtf8(SA);
|
|
end;
|
|
seUTF8:
|
|
begin
|
|
// Read one, two or three bytes in the buffer
|
|
B1 := 0;
|
|
FStream.Read(B1, 1);
|
|
FBuffer := AnsiChar(B1);
|
|
if (B1 and $80) > 0 then
|
|
begin
|
|
if (B1 and $20) <> 0 then
|
|
begin
|
|
B2 := 0;
|
|
FStream.Read(B2, 1);
|
|
FBuffer := FBuffer + UTF8String(AnsiChar(B2));
|
|
end;
|
|
B3 := 0;
|
|
FStream.Read(B3, 1);
|
|
FBuffer := FBuffer + UTF8String(AnsiChar(B3));
|
|
end;
|
|
end;
|
|
se16BitBE, se16BitLE, seUTF16BE, seUTF16LE:
|
|
begin
|
|
// Read two bytes
|
|
W := 0;
|
|
FStream.Read(W, 2);
|
|
// Swap byte order
|
|
if FSwapByteOrder then
|
|
W := swap(W);
|
|
// Convert to UTF8 in buffer
|
|
FBuffer := sdUnicodeToUtf8(UnicodeChar(W));
|
|
end;
|
|
else
|
|
raise EStreamError.Create(sxeUnsupportedEncoding);
|
|
end;//case
|
|
end;
|
|
|
|
// Now we have the buffer, so read
|
|
if (FBufferPos > 0) and (FBufferPos <= length(FBuffer)) then
|
|
Result := byte(FBuffer[FBufferPos]);
|
|
inc(FBufferPos);
|
|
end;
|
|
|
|
procedure TsdUtf8Stream.WriteBuf(const Buffer{$IFDEF CLR}: TBytes{$ENDIF}; Offset, Count: longint);
|
|
begin
|
|
case FEncoding of
|
|
seUtf8:
|
|
begin
|
|
// one on one
|
|
if StreamWrite(FStream, Buffer, Offset, Count) <> Count then
|
|
raise EStreamError.Create(sxeCannotWriteToOutputStream);
|
|
end
|
|
else
|
|
inherited;
|
|
end;//case
|
|
end;
|
|
|
|
procedure TsdUtf8Stream.WriteByte(const B: byte);
|
|
var
|
|
SA: AnsiString;
|
|
SW: UnicodeString;
|
|
MustWrite: boolean;
|
|
begin
|
|
case FEncoding of
|
|
seAnsi, se16BitBE, se16BitLE, seUTF16BE, seUTF16LE:
|
|
begin
|
|
MustWrite := True;
|
|
case Length(FBuffer) of
|
|
0:
|
|
begin
|
|
FBuffer := AnsiChar(B);
|
|
if (B and $80) <> 0 then
|
|
MustWrite := False;
|
|
end;
|
|
1:
|
|
begin
|
|
FBuffer := FBuffer + UTF8String(AnsiChar(B));
|
|
if (byte(FBuffer[1]) and $20) <> 0 then
|
|
MustWrite := False;
|
|
end;
|
|
2: FBuffer := FBuffer + UTF8String(AnsiChar(B));
|
|
end;
|
|
if MustWrite then
|
|
begin
|
|
if FEncoding = seAnsi then
|
|
begin
|
|
// Convert to ansi
|
|
SA := sdUtf8ToAnsi(FBuffer);
|
|
// write out
|
|
if length(SA) = 1 then
|
|
if FStream.Write(SA[1], 1) <> 1 then
|
|
raise EStreamError.Create(sxeCannotWriteToOutputStream);
|
|
end else
|
|
begin
|
|
// Convert to unicode
|
|
SW := sdUtf8ToUnicode(FBuffer);
|
|
// write out
|
|
if length(SW) = 1 then
|
|
if FStream.Write(SW[1], 2) <> 2 then
|
|
raise EStreamError.Create(sxeCannotWriteToOutputStream);
|
|
end;
|
|
FBuffer := '';
|
|
end;
|
|
end;
|
|
seUTF8:
|
|
begin
|
|
// Just a flat write of one byte
|
|
if FStream.Write(B, 1) <> 1 then
|
|
raise EStreamError.Create(sxeCannotWriteToOutputStream);
|
|
end;
|
|
else
|
|
raise EStreamError.Create(sxeUnsupportedEncoding);
|
|
end;//case
|
|
end;
|
|
|
|
{$IFDEF CLR}
|
|
{ TsdBufferedStream }
|
|
|
|
constructor TsdBufferedStream.Create(AStream: TStream; Owned: Boolean = False);
|
|
begin
|
|
inherited Create;
|
|
FStream := AStream;
|
|
FOwned := Owned;
|
|
end;
|
|
|
|
destructor TsdBufferedStream.Destroy;
|
|
begin
|
|
if FOwned then FreeAndNil(FStream);
|
|
inherited Destroy;
|
|
end;
|
|
|
|
function TsdBufferedStream.Read(var Buffer: array of Byte; Offset, Count: Longint): Longint;
|
|
begin
|
|
Result := FStream.Read(Buffer, Offset, Count);
|
|
end;
|
|
|
|
function TsdBufferedStream.Write(const Buffer: array of Byte; Offset, Count: Longint): Longint;
|
|
begin
|
|
Result := FStream.Write(Buffer, Offset, Count);
|
|
end;
|
|
|
|
function TsdBufferedStream.Seek(const Offset: Int64; Origin: TSeekOrigin): Int64;
|
|
begin
|
|
Result := FStream.Seek(Offset, Origin);
|
|
end;
|
|
|
|
procedure TsdBufferedStream.SetSize(NewSize: Int64);
|
|
begin
|
|
FStream.Size := NewSize;
|
|
end;
|
|
|
|
{$ELSE}
|
|
|
|
{ TsdBufferedReadStream }
|
|
|
|
const
|
|
cMaxBufferSize = $10000; // 65536 bytes in the buffer
|
|
|
|
procedure TsdBufferedReadStream.CheckPosition;
|
|
var
|
|
NewPage: integer;
|
|
FStartPos: longint;
|
|
begin
|
|
// Page and buffer position
|
|
NewPage := FPosition div cMaxBufferSize;
|
|
FBufPos := FPosition mod cMaxBufferSize;
|
|
|
|
// Read new page if required
|
|
if (NewPage <> FPage) then
|
|
begin
|
|
// New page and buffer
|
|
FPage := NewPage;
|
|
|
|
// Start position in stream
|
|
FStartPos := FPage * cMaxBufferSize;
|
|
FBufSize := Min(cMaxBufferSize, FStream.Size - FStartPos);
|
|
|
|
FStream.Seek(FStartPos, soBeginning);
|
|
if FBufSize > 0 then
|
|
FStream.Read(FBuffer^, FBufSize);
|
|
end;
|
|
FMustCheck := False;
|
|
end;
|
|
|
|
constructor TsdBufferedReadStream.Create(AStream: TStream; Owned: boolean);
|
|
begin
|
|
inherited Create;
|
|
FStream := AStream;
|
|
FOwned := Owned;
|
|
FMustCheck := True;
|
|
FPage := -1; // Set to invalid number to force an update on first read
|
|
ReallocMem(FBuffer, cMaxBufferSize);
|
|
end;
|
|
|
|
destructor TsdBufferedReadStream.Destroy;
|
|
begin
|
|
if FOwned then FreeAndNil(FStream);
|
|
ReallocMem(FBuffer, 0);
|
|
inherited;
|
|
end;
|
|
|
|
function TsdBufferedReadStream.Read(var Buffer; Count: longint): Longint;
|
|
var
|
|
Packet: PByte;
|
|
PacketCount: integer;
|
|
begin
|
|
// Set the right page
|
|
if FMustCheck then
|
|
CheckPosition;
|
|
|
|
// Special case - read one byte, most often
|
|
if (Count = 1) and (FBufPos < FBufSize - 1) then
|
|
begin
|
|
byte(Buffer) := FBuffer^[FBufPos];
|
|
inc(FBufPos);
|
|
inc(FPosition);
|
|
Result := 1;
|
|
exit;
|
|
end;
|
|
|
|
// general case
|
|
Packet := @Buffer;
|
|
Result := 0;
|
|
while Count > 0 do
|
|
begin
|
|
PacketCount := min(FBufSize - FBufPos, Count);
|
|
if PacketCount <= 0 then
|
|
exit;
|
|
Move(FBuffer^[FBufPos], Packet^, PacketCount);
|
|
dec(Count, PacketCount);
|
|
inc(Packet, PacketCount);
|
|
inc(Result, PacketCount);
|
|
inc(FPosition, PacketCount);
|
|
inc(FBufPos, PacketCount);
|
|
if FBufPos >= FBufSize then
|
|
CheckPosition;
|
|
end;
|
|
end;
|
|
|
|
function TsdBufferedReadStream.Seek(Offset: longint; Origin: Word): Longint;
|
|
begin
|
|
case Origin of
|
|
soFromBeginning:
|
|
FPosition := Offset;
|
|
soFromCurrent:
|
|
begin
|
|
// no need to check in this case - it is the GetPosition command
|
|
if Offset = 0 then
|
|
begin
|
|
Result := FPosition;
|
|
exit;
|
|
end;
|
|
FPosition := FPosition + Offset;
|
|
end;
|
|
soFromEnd:
|
|
FPosition := FStream.Size + Offset;
|
|
end;//case
|
|
Result := FPosition;
|
|
FMustCheck := True;
|
|
end;
|
|
|
|
function TsdBufferedReadStream.Write(const Buffer; Count: longint): Longint;
|
|
begin
|
|
raise EStreamError.Create(sxeCannotWriteCodecForReading);
|
|
end;
|
|
|
|
{ TsdBufferedWriteStream }
|
|
|
|
constructor TsdBufferedWriteStream.Create(AStream: TStream; Owned: boolean);
|
|
begin
|
|
inherited Create;
|
|
FStream := AStream;
|
|
FOwned := Owned;
|
|
ReallocMem(FBuffer, cMaxBufferSize);
|
|
end;
|
|
|
|
destructor TsdBufferedWriteStream.Destroy;
|
|
begin
|
|
Flush;
|
|
if FOwned then
|
|
FreeAndNil(FStream);
|
|
ReallocMem(FBuffer, 0);
|
|
inherited;
|
|
end;
|
|
|
|
procedure TsdBufferedWriteStream.Flush;
|
|
begin
|
|
// Write the buffer to the stream
|
|
if FBufPos > 0 then
|
|
begin
|
|
FStream.Write(FBuffer^, FBufPos);
|
|
FBufPos := 0;
|
|
end;
|
|
end;
|
|
|
|
function TsdBufferedWriteStream.Read(var Buffer; Count: longint): Longint;
|
|
begin
|
|
raise EStreamError.Create(sxeCannotReadCodecForWriting);
|
|
end;
|
|
|
|
function TsdBufferedWriteStream.Seek(Offset: longint; Origin: Word): Longint;
|
|
begin
|
|
case Origin of
|
|
soFromBeginning:
|
|
if Offset = FPosition then
|
|
begin
|
|
Result := FPosition;
|
|
exit;
|
|
end;
|
|
soFromCurrent:
|
|
begin
|
|
// GetPosition command
|
|
if Offset = 0 then
|
|
begin
|
|
Result := FPosition;
|
|
exit;
|
|
end;
|
|
end;
|
|
soFromEnd:
|
|
if Offset = 0 then
|
|
begin
|
|
Result := FPosition;
|
|
exit;
|
|
end;
|
|
end;//case
|
|
raise EStreamError.Create(sxeCannotPerformSeek);
|
|
end;
|
|
|
|
function TsdBufferedWriteStream.Write(const Buffer; Count: longint): Longint;
|
|
var
|
|
Packet: PByte;
|
|
PacketCount: integer;
|
|
begin
|
|
// Special case - read less bytes than would fill buffersize
|
|
if (FBufPos + Count < cMaxBufferSize) then
|
|
begin
|
|
Move(Buffer, FBuffer^[FBufPos], Count);
|
|
inc(FBufPos, Count);
|
|
inc(FPosition, Count);
|
|
Result := Count;
|
|
exit;
|
|
end;
|
|
|
|
// general case that wraps buffer
|
|
Packet := @Buffer;
|
|
Result := 0;
|
|
while Count > 0 do
|
|
begin
|
|
PacketCount := min(cMaxBufferSize - FBufPos, Count);
|
|
if PacketCount <= 0 then
|
|
exit;
|
|
Move(Packet^, FBuffer^[FBufPos], PacketCount);
|
|
dec(Count, PacketCount);
|
|
inc(Result, PacketCount);
|
|
inc(FPosition, PacketCount);
|
|
inc(Packet, PacketCount);
|
|
inc(FBufPos, PacketCount);
|
|
if FBufPos = cMaxBufferSize then
|
|
Flush;
|
|
end;
|
|
end;
|
|
{$ENDIF}
|
|
|
|
{ TsdSurplusReader }
|
|
|
|
constructor TsdSurplusReader.Create(AStream: TStream);
|
|
begin
|
|
inherited Create;
|
|
FStream := AStream;
|
|
end;
|
|
|
|
function TsdSurplusReader.ReadChar(var Ch: AnsiChar): integer;
|
|
begin
|
|
if length(FSurplus) > 0 then
|
|
begin
|
|
Ch := FSurplus[1];
|
|
FSurplus := copy(FSurplus, 2, length(FSurplus) - 1);
|
|
Result := 1;
|
|
end else
|
|
Result := FStream.Read(Ch, 1);
|
|
end;
|
|
|
|
function TsdSurplusReader.ReadCharSkipBlanks(var Ch: AnsiChar): boolean;
|
|
begin
|
|
Result := False;
|
|
repeat
|
|
// Read AnsiCharacter, exit if none available
|
|
if ReadChar(Ch) = 0 then
|
|
exit;
|
|
// Skip if in controlchars
|
|
if not (Ch in cControlchars) then
|
|
break;
|
|
until False;
|
|
Result := True;
|
|
end;
|
|
|
|
{ TsdStringBuilder }
|
|
|
|
procedure TsdStringBuilder.AddChar(Ch: AnsiChar);
|
|
begin
|
|
inc(FCurrentIdx);
|
|
Reallocate(FCurrentIdx);
|
|
FData[FCurrentIdx] := Ch;
|
|
end;
|
|
|
|
procedure TsdStringBuilder.AddString(var S: UTF8String);
|
|
var
|
|
{$IFDEF CLR}
|
|
i: integer;
|
|
{$ENDIF}
|
|
Count: integer;
|
|
begin
|
|
{$IFDEF CLR}
|
|
Count := S.Length;
|
|
{$ELSE}
|
|
Count := System.length(S);
|
|
{$ENDIF}
|
|
if Count = 0 then
|
|
exit;
|
|
Reallocate(FCurrentIdx + Count);
|
|
{$IFDEF CLR}
|
|
for i := 1 to S.Length do
|
|
FData[FCurrentIdx + i] := S[i];
|
|
{$ELSE}
|
|
Move(S[1], FData[FCurrentIdx + 1], Count);
|
|
{$ENDIF}
|
|
inc(FCurrentIdx, Count);
|
|
end;
|
|
|
|
procedure TsdStringBuilder.Clear;
|
|
begin
|
|
FCurrentIdx := 0;
|
|
end;
|
|
|
|
function TsdStringBuilder.StringCopy(AFirst, ALength: integer): UTF8String;
|
|
begin
|
|
if ALength > FCurrentIdx - AFirst + 1 then
|
|
ALength := FCurrentIdx - AFirst + 1;
|
|
Result := Copy(FData, AFirst, ALength);
|
|
end;
|
|
|
|
constructor TsdStringBuilder.Create;
|
|
begin
|
|
inherited Create;
|
|
SetLength(FData, 64);
|
|
end;
|
|
|
|
function TsdStringBuilder.GetData(Index: integer): AnsiChar;
|
|
begin
|
|
Result := FData[Index];
|
|
end;
|
|
|
|
procedure TsdStringBuilder.Reallocate(RequiredLength: integer);
|
|
begin
|
|
{$IFDEF CLR}
|
|
while FData.Length < RequiredLength do
|
|
SetLength(FData, FData.Length * 2);
|
|
{$ELSE}
|
|
while System.Length(FData) < RequiredLength do
|
|
SetLength(FData, System.Length(FData) * 2);
|
|
{$ENDIF}
|
|
end;
|
|
|
|
function TsdStringBuilder.Value: UTF8String;
|
|
begin
|
|
Result := Copy(FData, 1, FCurrentIdx);
|
|
end;
|
|
|
|
end.
|