File type identifiers
C#
/// <summary>
/// File type identifiers.
/// </summary>
/// <remarks>
/// Some older file parsers are still supported for backward compatibility,
/// so a few file formats have more than one identifier. Not every format
/// listed here is supported for content extraction or indexing.
/// Numeric values are assigned explicitly and are not contiguous.
/// </remarks>
public enum TypeId
{
    it_WordList = 104,                      // List of words in UTF-8, each preceded by its word ordinal
    it_ContentAsXml = 108,                  // FileConverter output: content, metadata, and attachments as XML
    it_Ami = 201,                           // Ami Pro
    it_Ansi = 202,                          // ANSI text file
    it_Ascii = 203,                         // ASCII (DOS) text file
    it_Binary = 204,                        // Binary file (unrecognized format)
    it_CompoundDoc = 205,                   // OLE Compound Document (or "DocFile")
    it_DBF = 206,                           // XBase database file
    it_FilteredBinary = 207,                // Filtered binary file
    it_HyperText = 208,                     // Obsolete
    it_MS_Word = 209,                       // Obsolete
    it_MS_Works = 210,                      // Microsoft Works word processor
    it_Multimate = 211,                     // Multimate (any version)
    it_RTF = 212,                           // Microsoft Rich Text Format
    it_WS_2000 = 213,                       // WordStar 2000
    it_WS_5 = 214,                          // WordStar version 5 or 6
    it_WinWrite = 215,                      // Windows Write
    it_WordForDos = 215,                    // Word for DOS; intentionally the same value as it_WinWrite
    it_WordForWin = 216,                    // Obsolete
    it_WordForWin6 = 217,                   // Microsoft Word 6.0
    it_WordPerfect42 = 218,                 // WordPerfect 4.2
    it_WordPerfect5 = 219,                  // WordPerfect 5
    it_WordPerfect6 = 220,                  // WordPerfect 6
    it_WordStar = 221,                      // WordStar through version 4
    it_XyWrite = 222,                       // XyWrite
    it_ZIP = 223,                           // ZIP archive
    it_Properties = 224,                    // PropertySet stream in a Compound Document
    it_Excel5 = 225,                        // Excel versions 5 and 7
    it_HTML = 226,                          // HTML
    it_PDF = 227,                           // PDF
    it_WordForWin97 = 228,                  // Word for Windows 97, 2000, XP, or 2003
    it_Excel97 = 229,                       // Excel 97, 2000, XP, or 2003
    it_PowerPoint = 230,                    // PowerPoint 97-2003
    it_EncryptedHtml = 231,                 // Obsolete
    it_DatabaseRecord = 232,                // Record in a database file (such as XBase or Access)
    it_SegmentedText = 233,                 // Text segmented using File Segmentation Rules
    it_XML = 234,                           // XML
    it_WordPerfectEmbedded = 235,           // WordPerfect document embedded in another file
    it_Unicode = 236,                       // 16-bit Unicode text
    it_EudoraMessage = 237,                 // Message in a Eudora message store
    it_Utf8 = 238,                          // UTF-8 text
    it_OutlookExpressMessage = 240,         // Message in an Outlook Express message store
    it_MimeMessage = 241,                   // dtSearch 6.40 and earlier parser for .eml files
    it_SingleByteText = 242,                // Single-byte text, encoding automatically detected
    it_MBoxArchive = 243,                   // MBOX email archive (dtSearch 7.50 and earlier)
    it_FilteredBinaryUnicode = 244,         // Binary file filtered using Unicode Filtering
    it_ZIP_zlib = 245,                      // ZIP file parsed using zlib
    it_OutlookMsgFile = 246,                // Microsoft Outlook .MSG file
    it_TreepadHjtFile = 247,                // TreePad file (HJT format in TreePad 6 and earlier)
    it_PfsProfessionalWrite = 248,          // PFS Professional Write file
    it_FilteredBinaryUnicodeStream = 249,   // Unicode-filtered binary file, not split into segments
    it_DocFile = 250,                       // Compound document (new parser)
    it_Media = 251,                         // Music or video file
    it_NonTextData = 252,                   // Data file with no text to index
    it_EML = 253,                           // MIME stream handled as a single document
    it_MicrosoftWord = 254,                 // Microsoft Word 95 - 2003 (dtSearch 6.5 and later)
    it_UnformattedHTML = 256,               // Output only: HTML-encoded synopsis without formatting
    it_DatabaseRecord2 = 257,               // Database record (rendered as HTML)
    it_Excel2003Xml = 258,                  // Microsoft Excel 2003 XML format
    it_Word2003Xml = 259,                   // Microsoft Word 2003 XML format
    it_OpenOfficeDocument = 260,            // OpenOffice 1, 2, and 3 documents (includes OASIS ODF)
    it_CSV = 261,                           // Comma-separated values file
    it_MicrosoftAccess = 262,               // Microsoft Access database
    it_XBase = 263,                         // XBase database
    it_OutlookExpressMessageStore = 264,    // Outlook Express dbx archive (versions 7.67 and earlier)
    it_IFilter = 265,                       // File type processed using installed IFilter
    it_Gzip = 266,                          // Archive compressed with gzip
    it_Excel4 = 267,                        // Excel version 4
    it_Word12 = 268,                        // Word 2007
    it_Excel12 = 269,                       // Excel 2007
    it_PowerPoint12 = 270,                  // PowerPoint 2007
    it_TNEF = 271,                          // Transport-neutral encapsulation format
    it_XPS = 272,                           // XML Paper Specification (Metro)
    it_WMF = 273,                           // Windows Metafile Format (Win16)
    it_EMF = 274,                           // Windows Metafile Format (Win32)
    it_TAR = 275,                           // TAR archive
    it_Excel2 = 277,                        // Excel version 2
    it_Excel3 = 278,                        // Excel version 3
    it_MBoxArchive2 = 279,                  // MBOX email archive (dtSearch 7.51 and later)
    it_Lotus123 = 280,                      // Lotus 123 spreadsheet
    it_MsWorksWps4 = 281,                   // Microsoft Works WPS versions 4 and 5
    it_MsWorksWps6 = 282,                   // Microsoft Works WPS versions 6, 7, 8, and 9
    it_QuattroPro = 283,                    // Quattro Pro 9 and newer
    it_QuattroPro8 = 284,                   // Quattro Pro 8 and older
    it_OutlookMsgAsContainer = 285,         // Outlook .MSG file processed as a container
    it_MimeContainer = 286,                 // MIME-encoded message, processed as a container
    it_PdfWithAttachments = 287,            // PDF file with attachments
    it_MicrosoftAccess2 = 288,              // Microsoft Access (parsed directly, not via ODBC or Jet)
    it_FlashSWF = 289,                      // Flash SWF
    it_RAR = 290,                           // RAR archive
    it_NoContent = 291,                     // File indexed with all content ignored (see dtsoIndexBinaryNoContent)
    it_Excel12xlsb = 292,                   // Excel 2007 XLSB format
    it_XfaForm = 293,                       // XFA form
    it_MifFile = 294,                       // FrameMaker MIF file
    it_WordForWindows2 = 295,               // Word for Windows 2
    it_ASF = 296,                           // ASF file
    it_MP3 = 297,                           // MP3 file
    it_QuickTime = 298,                     // QuickTime file
    it_MP4 = 299,                           // MP4 file
    it_M4A = 300,                           // M4A file
    it_MPG = 301,                           // MPEG file
    it_JPEG = 302,                          // JPEG file
    it_TIFF = 303,                          // TIFF file
    it_MDI = 304,                           // MDI image file
    it_GIF = 305,                           // GIF image file
    it_PNG = 306,                           // PNG image file
    it_CAB = 308,                           // CAB archive
    it_dtSearchIndex = 309,                 // dtSearch index file
    it_HtmlHelp = 310,                      // HTML Help CHM file
    it_TrueTypeFont = 311,                  // TrueType TTF file
    it_WAV = 312,                           // WAV sound file
    it_BMP = 313,                           // BMP image file
    it_AVI = 314,                           // AVI file
    it_Visio = 315,                         // Visio file
    it_Ichitaro = 316,                      // Ichitaro word processor file (versions 8 through 2011)
    it_SolidWorks = 317,                    // SolidWorks file
    it_Unigraphics = 318,                   // Unigraphics file (docfile format)
    it_DWG = 319,                           // DWG CAD file
    it_DWF = 320,                           // DWF CAD file
    it_DXF = 321,                           // DXF CAD file
    it_VisioXml = 322,                      // Visio XML file
    it_WordForWindows1 = 323,               // Word for Windows 1
    it_OutlookPst = 324,                    // Outlook PST message store
    it_MicrosoftOfficeThemeData = 325,      // Microsoft Office .thmx file with theme data
    it_MIDI = 326,                          // MIDI file
    it_OutlookExpressMessageStore2 = 327,   // Outlook Express dbx archive
    it_PowerPoint4 = 328,                   // PowerPoint 4
    it_PowerPoint95 = 329,                  // PowerPoint 95
    it_PowerPoint3 = 330,                   // PowerPoint 3
    it_Ichitaro5 = 331,                     // Ichitaro versions 5, 6, 7
    it_OleDataMso = 332,                    // oledata.mso file
    it_CsvAsReport = 333,                   // CSV parsed as a report (like a spreadsheet), not a database
    it_CsvAsDocument = 334,                 // CSV parsed as a single file listing all records
    it_MicrosoftAccessAsDocument = 335,     // Access database parsed as a single file listing all records
    it_XBaseAsDocument = 336,               // XBase file parsed as a single file listing all records
    it_OneNote2003 = 337,                   // Not supported
    it_OneNote2007 = 338,                   // OneNote 2007
    it_OneNote2010 = 339,                   // OneNote 2010, 2013, and 2016
    it_JpegXR = 340,                        // Windows Media Photo/HDPhoto/*.wdp
    it_WindowsExecutable = 341,             // Windows .exe or .dll
    it_ElfExecutable = 342,                 // ELF format executable
    it_ICalendar = 343,                     // iCalendar (*.ics) file
    it_MicrosoftPublisher = 344,            // Microsoft Publisher file
    it_PhotoshopImage = 346,                // Photoshop Image (*.psd)
    it_Cals = 347,                          // CALS metadata format described in MIL-STD-1840C
    it_iWork2009 = 348,                     // iWork 2009
    it_iWork2009Pages = 349,                // iWork 2009 Pages document
    it_iWork2009Numbers = 350,              // iWork 2009 Numbers spreadsheet
    it_iWork2009Keynote = 351,              // iWork 2009 Keynote presentation
    it_Visio2013 = 352,                     // Visio 2013 document
    it_SASF = 353,                          // SASF call center audio file
    it_Unigraphics2 = 354,                  // Unigraphics file (#UGC format)
    it_OneNoteOnline = 355,                 // OneNote variant generated by Microsoft online services
    it_7z = 359                             // 7-zip archive (not supported)
}
Members
Members |
Description |
---|---|
it_WordList |
List of words in UTF-8 format, with the word ordinal in front of each word |
it_ContentAsXml |
Output format for FileConverter that organizes document content, metadata, and attachments into a standard XML format |
it_Ami |
Ami Pro |
it_Ansi |
ANSI text file |
it_Ascii |
ASCII (DOS) text file |
it_Binary |
Binary file (unrecognized format) |
it_CompoundDoc |
OLE Compound Document (or "DocFile") |
it_DBF |
XBase database file |
it_FilteredBinary |
Filtered binary file |
it_HyperText |
Obsolete |
it_MS_Word |
Obsolete |
it_MS_Works |
Microsoft Works word processor |
it_Multimate |
Multimate (any version) |
it_RTF |
Microsoft Rich Text Format |
it_WS_2000 |
WordStar 2000 |
it_WS_5 |
WordStar version 5 or 6 |
it_WinWrite |
Windows Write |
it_WordForDos |
Word for DOS (same as Windows Write, it_WinWrite) |
it_WordForWin |
Obsolete |
it_WordForWin6 |
Microsoft Word 6.0 |
it_WordPerfect42 |
WordPerfect 4.2 |
it_WordPerfect5 |
WordPerfect 5 |
it_WordPerfect6 |
WordPerfect 6 |
it_WordStar |
WordStar through version 4 |
it_XyWrite |
XyWrite |
it_ZIP |
ZIP archive |
it_Properties |
PropertySet stream in a Compound Document |
it_Excel5 |
Excel versions 5 and 7 |
it_HTML |
HTML |
it_PDF |
PDF |
it_WordForWin97 |
Word For Windows 97, 2000, XP, or 2003 |
it_Excel97 |
Excel 97, 2000, XP, or 2003 |
it_PowerPoint |
PowerPoint 97-2003 |
it_EncryptedHtml |
Obsolete |
it_DatabaseRecord |
Record in a database file (such as XBase or Access) |
it_SegmentedText |
Text segmented using File Segmentation Rules |
it_XML |
XML |
it_WordPerfectEmbedded |
WordPerfect document embedded in another file |
it_Unicode |
UTF-16 text |
it_EudoraMessage |
Message in a Eudora message store |
it_Utf8 |
UTF-8 text |
it_OutlookExpressMessage |
Message in an Outlook Express message store |
it_MimeMessage |
dtSearch 6.40 and earlier file parser for .eml files |
it_SingleByteText |
Single-byte text, encoding automatically detected |
it_MBoxArchive |
Email archive conforming to the MBOX standard (dtSearch versions 7.50 and earlier) |
it_FilteredBinaryUnicode |
Binary file filtered using Unicode Filtering |
it_ZIP_zlib |
ZIP file parsed using zlib |
it_OutlookMsgFile |
Microsoft Outlook .MSG file |
it_TreepadHjtFile |
TreePad file (HJT format in TreePad 6 and earlier) |
it_PfsProfessionalWrite |
PFS Professional Write file |
it_FilteredBinaryUnicodeStream |
Binary file filtered using Unicode Filtering, not split into segments |
it_DocFile |
Compound document (new parser) |
it_Media |
Music or video file |
it_NonTextData |
Data file with no text to index |
it_EML |
MIME stream handled as a single document |
it_MicrosoftWord |
Microsoft Word 95 - 2003 (dtSearch versions 6.5 and later) |
it_UnformattedHTML |
Output format only, for generating a synopsis that is HTML-encoded but that does not include formatting such as font settings, paragraph breaks, etc. |
it_DatabaseRecord2 |
Database record (rendered as HTML) |
it_Excel2003Xml |
Microsoft Excel 2003 XML format |
it_Word2003Xml |
Microsoft Word 2003 XML format |
it_OpenOfficeDocument |
OpenOffice versions 1, 2, and 3 documents, spreadsheets, and presentations (*.sxc, *.sxd, *.sxi, *.sxw, *.sxg, *.stc, *.sti, *.stw, *.stm, *.odt, *.ott, *.odg, *.otg, *.odp, *.otp, *.ods, *.ots, *.odf) (includes OASIS Open Document Format for Office Applications) |
it_CSV |
Comma-separated values file |
it_MicrosoftAccess |
Microsoft Access database |
it_XBase |
XBase database |
it_OutlookExpressMessageStore |
Outlook Express dbx archive (versions 7.67 and earlier) |
it_IFilter |
File type processed using installed IFilter |
it_Gzip |
Archive compressed with gzip |
it_Excel4 |
Excel version 4 |
it_Word12 |
Word 2007 |
it_Excel12 |
Excel 2007 |
it_PowerPoint12 |
PowerPoint 2007 |
it_TNEF |
Transport-neutral encapsulation format |
it_XPS |
XML Paper Specification (Metro) |
it_WMF |
Windows Metafile Format (Win16) |
it_EMF |
Windows Metafile Format (Win32) |
it_TAR |
TAR archive |
it_Excel2 |
Excel version 2 |
it_Excel3 |
Excel version 3 |
it_MBoxArchive2 |
Email archive conforming to the MBOX standard (dtSearch versions 7.51 and later) |
it_Lotus123 |
Lotus 123 spreadsheet |
it_MsWorksWps4 |
Microsoft Works WPS versions 4 and 5 |
it_MsWorksWps6 |
Microsoft Works WPS versions 6, 7, 8, and 9 |
it_QuattroPro |
Quattro Pro 9 and newer |
it_QuattroPro8 |
Quattro Pro 8 and older |
it_OutlookMsgAsContainer |
Outlook .MSG file processed as a container |
it_MimeContainer |
MIME-encoded message, processed as a container |
it_PdfWithAttachments |
PDF file with attachments |
it_MicrosoftAccess2 |
Microsoft Access (parsed directly, not via ODBC or the Jet Engine) |
it_FlashSWF |
Flash SWF |
it_RAR |
RAR archive |
it_NoContent |
File indexed with all content ignored (see dtsoIndexBinaryNoContent) |
it_Excel12xlsb |
Excel 2007 XLSB format |
it_XfaForm |
XFA form |
it_MifFile |
FrameMaker MIF file |
it_WordForWindows2 |
Word for Windows 2 |
it_ASF |
ASF file |
it_MP3 |
MP3 file |
it_QuickTime |
QuickTime file |
it_MP4 |
MP4 file |
it_M4A |
M4A file |
it_MPG |
MPEG file |
it_JPEG |
JPEG file |
it_TIFF |
TIFF file |
it_MDI |
MDI image file |
it_GIF |
GIF image file |
it_PNG |
PNG image file |
it_CAB |
CAB archive |
it_dtSearchIndex |
dtSearch index file |
it_HtmlHelp |
HTML Help CHM file |
it_TrueTypeFont |
TrueType TTF file |
it_WAV |
WAV sound file |
it_BMP |
BMP image file |
it_AVI |
AVI file |
it_Visio |
Visio file |
it_Ichitaro |
Ichitaro word processor file (versions 8 through 2011) |
it_SolidWorks |
SolidWorks file |
it_Unigraphics |
Unigraphics file (docfile format) |
it_DWG |
DWG CAD file |
it_DWF |
DWF CAD file |
it_DXF |
DXF CAD file |
it_VisioXml |
Visio XML file |
it_WordForWindows1 |
Word for Windows 1 |
it_OutlookPst |
Outlook PST message store |
it_MicrosoftOfficeThemeData |
Microsoft Office .thmx file with theme data |
it_MIDI |
MIDI file |
it_OutlookExpressMessageStore2 |
Outlook Express dbx archive |
it_PowerPoint4 |
PowerPoint 4 |
it_PowerPoint95 |
PowerPoint 95 |
it_PowerPoint3 |
PowerPoint 3 |
it_Ichitaro5 |
Ichitaro versions 5, 6, 7 |
it_OleDataMso |
oledata.mso file |
it_CsvAsReport |
CSV file parsed as a report (like a spreadsheet) instead of as a database |
it_CsvAsDocument |
CSV file parsed as a single file listing all records |
it_MicrosoftAccessAsDocument |
Access database parsed as a single file listing all records |
it_XBaseAsDocument |
XBase file parsed as a single file listing all records |
it_OneNote2003 |
OneNote 2003 (not supported) |
it_OneNote2007 |
OneNote 2007 |
it_OneNote2010 |
OneNote 2010, 2013, and 2016 |
it_JpegXR |
Windows Media Photo/HDPhoto/*.wdp |
it_WindowsExecutable |
Windows .exe or .dll |
it_ElfExecutable |
ELF format executable |
it_ICalendar |
iCalendar (*.ics) file |
it_MicrosoftPublisher |
Microsoft Publisher file |
it_PhotoshopImage |
Photoshop Image (*.psd) |
it_Cals |
CALS metadata format described in MIL-STD-1840C |
it_iWork2009 |
iWork 2009 |
it_iWork2009Pages |
iWork 2009 Pages document |
it_iWork2009Numbers |
iWork 2009 Numbers spreadsheet |
it_iWork2009Keynote |
iWork 2009 Keynote presentation |
it_Visio2013 |
Visio 2013 document |
it_SASF |
SASF call center audio file |
it_Unigraphics2 |
Unigraphics file (#UGC format) |
it_OneNoteOnline |
OneNote variant generated by Microsoft online services |
it_7z |
7-zip archive (not supported) |
Remarks
Because some older file parsers are still supported for backward compatibility, in a few cases there may be more than one TypeId for a file format. Not all file formats listed are supported for content extraction or indexing. For a current list of supported file types, see: http://support.dtsearch.com/faq/dts0103.htm
See Also