The Binary Text Extractor configuration file, BinaryTextorConfig.xml, uses the following schema:
<?xml version="1.0" encoding="utf-8"?>
<xs:schema xmlns:xs="http://www.w3.org/2001/XMLSchema"
           elementFormDefault="qualified"
           attributeFormDefault="unqualified">

  <!-- ============================================================
       Top-level element.
       A configuration document is a single UniversalBinaryTextor
       element holding zero or more FileType children.
       ============================================================ -->
  <xs:element name="UniversalBinaryTextor">
    <xs:complexType>
      <xs:sequence>
        <xs:element name="FileType" type="FileTypeType"
                    minOccurs="0" maxOccurs="unbounded" />
      </xs:sequence>
    </xs:complexType>
  </xs:element>

  <!-- ============================================================
       FileType element type.
       Content is ordered: one or more MagicNumber elements first,
       followed by one or more Encoding elements.
       The 'name' attribute is an optional free-form string.
       ============================================================ -->
  <xs:complexType name="FileTypeType">
    <xs:sequence>
      <xs:element name="MagicNumber" type="MagicNumberType"
                  minOccurs="1" maxOccurs="unbounded" />
      <xs:element name="Encoding" type="EncodingType"
                  minOccurs="1" maxOccurs="unbounded" />
    </xs:sequence>
    <xs:attribute name="name" type="xs:string" use="optional" />
  </xs:complexType>

  <!-- ============================================================
       MagicNumber element type.
       The magic number can be a hex string or a text string; the
       'type' attribute selects which (see MagicNumberTypeEnum).
       All three attributes are optional in this schema.
       ============================================================ -->
  <xs:complexType name="MagicNumberType">
    <xs:attribute name="value" type="xs:string" use="optional" />
    <xs:attribute name="type" type="MagicNumberTypeEnum" use="optional" />
    <xs:attribute name="offSet" type="xs:integer" use="optional" />
  </xs:complexType>

  <!-- Permitted values for the MagicNumber 'type' attribute. -->
  <xs:simpleType name="MagicNumberTypeEnum">
    <xs:restriction base="xs:string">
      <xs:enumeration value="ascii-string" />
      <xs:enumeration value="hex-string" />
    </xs:restriction>
  </xs:simpleType>

  <!-- ============================================================
       Encoding element type.
       Contains one or more CharSet elements.
       'name' must be one of the supported encodings listed in
       EncodingEnumType; 'minLength' is an xs:unsignedByte, so it
       accepts whole numbers from 0 to 255. Both are required.
       ============================================================ -->
  <xs:complexType name="EncodingType">
    <xs:sequence>
      <xs:element name="CharSet" type="CharSetType"
                  minOccurs="1" maxOccurs="unbounded" />
    </xs:sequence>
    <xs:attribute name="name" type="EncodingEnumType" use="required" />
    <xs:attribute name="minLength" type="xs:unsignedByte" use="required" />
  </xs:complexType>

  <!-- Supported encodings. -->
  <xs:simpleType name="EncodingEnumType">
    <xs:restriction base="xs:string">
      <xs:enumeration value="ASCII" />
      <xs:enumeration value="UTF8" />
      <xs:enumeration value="UTF16_LITTLEENDIAN" />
      <xs:enumeration value="UTF16_BIGENDIAN" />
    </xs:restriction>
  </xs:simpleType>

  <!-- ============================================================
       CharSet element type.
       A character set is given either as an explicit range
       ('start' and 'end') or as a Unicode block name ('blockName').
       ============================================================ -->
  <xs:complexType name="CharSetType">
    <!-- If both 'start' and 'end' are populated, they are used
         instead of 'blockName'. Both are written in hex with a
         0x prefix, e.g. 0xF007. -->
    <xs:attribute name="start" type="xs:string" use="optional" />
    <xs:attribute name="end" type="xs:string" use="optional" />
    <!-- 'blockName' can be any Block Name from
         http://www.unicode.org/Public/UNIDATA/Blocks.txt
         Case, spaces, hyphens and underbars are ignored when
         comparing block names. -->
    <xs:attribute name="blockName" type="xs:string" use="optional" />
  </xs:complexType>

</xs:schema>
Copyright © 2014 CA. All rights reserved.