msdos 44 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200
  1. #------------------------------------------------------------------------------
  2. # $File: msdos,v 1.118 2017/05/20 19:55:27 christos Exp $
  3. # msdos: file(1) magic for MS-DOS files
  4. #
  5. # .BAT files (Daniel Quinlan, quinlan@yggdrasil.com)
  6. # updated by Joerg Jenderek at Oct 2008,Apr 2011
  7. 0 string/t @
  8. >1 string/cW \ echo\ off DOS batch file text
  9. !:mime text/x-msdos-batch
  10. >1 string/cW echo\ off DOS batch file text
  11. !:mime text/x-msdos-batch
  12. >1 string/cW rem DOS batch file text
  13. !:mime text/x-msdos-batch
  14. >1 string/cW set\ DOS batch file text
  15. !:mime text/x-msdos-batch
  16. # OS/2 batch files are REXX. the second regex is a bit generic, oh well
  17. # the matched commands seem to be common in REXX and uncommon elsewhere
  18. 100 search/0xffff rxfuncadd
  19. >100 regex/c =^[\ \t]{0,10}call[\ \t]{1,10}rxfunc OS/2 REXX batch file text
  20. 100 search/0xffff say
  21. >100 regex/c =^[\ \t]{0,10}say\ ['"] OS/2 REXX batch file text
  22. # updated by Joerg Jenderek at Oct 2015
  23. # https://de.wikipedia.org/wiki/Common_Object_File_Format
  24. # http://www.delorie.com/djgpp/doc/coff/filhdr.html
  25. # ./intel already labeled COFF type 0x14c=0514 as "80386 COFF executable"
  26. #0 leshort 0x14c MS Windows COFF Intel 80386 object file
  27. #>4 ledate x stamp %s
  28. 0 leshort 0x166 MS Windows COFF MIPS R4000 object file
  29. #>4 ledate x stamp %s
  30. 0 leshort 0x184 MS Windows COFF Alpha object file
  31. #>4 ledate x stamp %s
  32. 0 leshort 0x268 MS Windows COFF Motorola 68000 object file
  33. #>4 ledate x stamp %s
  34. 0 leshort 0x1f0 MS Windows COFF PowerPC object file
  35. #>4 ledate x stamp %s
  36. 0 leshort 0x290 MS Windows COFF PA-RISC object file
  37. #>4 ledate x stamp %s
  38. # Tests for various EXE types.
  39. #
  40. # Many of the compressed formats were extracted from IDARC 1.23 source code.
  41. #
  42. 0 string/b MZ
  43. # All non-DOS EXE extensions have the relocation table more than 0x40 bytes into the file.
  44. >0x18 leshort <0x40 MS-DOS executable
  45. !:mime application/x-dosexec
  46. # These traditional tests usually work but not always. When test quality support is
  47. # implemented these can be turned on.
  48. #>>0x18 leshort 0x1c (Borland compiler)
  49. #>>0x18 leshort 0x1e (MS compiler)
  50. # If the relocation table is 0x40 or more bytes into the file, it's definitely
  51. # not a DOS EXE.
  52. >0x18 leshort >0x3f
  53. # Maybe it's a PE?
  54. >>(0x3c.l) string PE\0\0 PE
  55. !:mime application/x-dosexec
  56. >>>(0x3c.l+24) leshort 0x010b \b32 executable
  57. >>>(0x3c.l+24) leshort 0x020b \b32+ executable
  58. >>>(0x3c.l+24) leshort 0x0107 ROM image
  59. >>>(0x3c.l+24) default x Unknown PE signature
  60. >>>>&0 leshort x 0x%x
  61. >>>(0x3c.l+22) leshort&0x2000 >0 (DLL)
  62. # "default" only fires if nothing at this level matched since the last "clear";
  62. # the PE signature tests above already matched here, so reset the flag first
  62. >>>(0x3c.l+92) clear x
  62. >>>(0x3c.l+92) leshort 1 (native)
  63. >>>(0x3c.l+92) leshort 2 (GUI)
  64. >>>(0x3c.l+92) leshort 3 (console)
  65. >>>(0x3c.l+92) leshort 7 (POSIX)
  66. >>>(0x3c.l+92) leshort 9 (Windows CE)
  67. >>>(0x3c.l+92) leshort 10 (EFI application)
  68. >>>(0x3c.l+92) leshort 11 (EFI boot service driver)
  69. >>>(0x3c.l+92) leshort 12 (EFI runtime driver)
  70. >>>(0x3c.l+92) leshort 13 (EFI ROM)
  71. >>>(0x3c.l+92) leshort 14 (XBOX)
  72. >>>(0x3c.l+92) leshort 15 (Windows boot application)
  73. >>>(0x3c.l+92) default x (Unknown subsystem
  74. >>>>&0 leshort x 0x%x)
  75. # reset the match flag again so the "Unknown processor type" default below
  75. # is reachable even though earlier tests at this level have matched
  75. >>>(0x3c.l+4) clear x
  75. >>>(0x3c.l+4) leshort 0x14c Intel 80386
  76. >>>(0x3c.l+4) leshort 0x166 MIPS R4000
  77. >>>(0x3c.l+4) leshort 0x168 MIPS R10000
  78. >>>(0x3c.l+4) leshort 0x184 Alpha
  79. >>>(0x3c.l+4) leshort 0x1a2 Hitachi SH3
  80. >>>(0x3c.l+4) leshort 0x1a6 Hitachi SH4
  81. >>>(0x3c.l+4) leshort 0x1c0 ARM
  82. >>>(0x3c.l+4) leshort 0x1c2 ARM Thumb
  83. >>>(0x3c.l+4) leshort 0x1c4 ARMv7 Thumb
  84. >>>(0x3c.l+4) leshort 0x1f0 PowerPC
  85. >>>(0x3c.l+4) leshort 0x200 Intel Itanium
  86. >>>(0x3c.l+4) leshort 0x266 MIPS16
  87. >>>(0x3c.l+4) leshort 0x268 Motorola 68000
  88. >>>(0x3c.l+4) leshort 0x290 PA-RISC
  89. >>>(0x3c.l+4) leshort 0x366 MIPSIV
  90. >>>(0x3c.l+4) leshort 0x466 MIPS16 with FPU
  91. >>>(0x3c.l+4) leshort 0xebc EFI byte code
  92. >>>(0x3c.l+4) leshort 0x8664 x86-64
  93. >>>(0x3c.l+4) leshort 0xc0ee MSIL
  94. >>>(0x3c.l+4) default x Unknown processor type
  95. >>>>&0 leshort x 0x%x
  96. >>>(0x3c.l+22) leshort&0x0200 >0 (stripped to external PDB)
  97. >>>(0x3c.l+22) leshort&0x1000 >0 system file
  98. >>>(0x3c.l+24) leshort 0x010b
  99. >>>>(0x3c.l+232) lelong >0 Mono/.Net assembly
  100. >>>(0x3c.l+24) leshort 0x020b
  101. >>>>(0x3c.l+248) lelong >0 Mono/.Net assembly
  102. # hooray, there's a DOS extender using the PE format, with a valid PE
  103. # executable inside (which just prints a message and exits if run in win)
  104. >>>(8.s*16) string 32STUB \b, 32rtm DOS extender
  105. >>>(8.s*16) string !32STUB \b, for MS Windows
  106. >>>(0x3c.l+0xf8) string UPX0 \b, UPX compressed
  107. >>>(0x3c.l+0xf8) search/0x140 PEC2 \b, PECompact2 compressed
  108. >>>(0x3c.l+0xf8) search/0x140 UPX2
  109. >>>>(&0x10.l+(-4)) string PK\3\4 \b, ZIP self-extracting archive (Info-Zip)
  110. >>>(0x3c.l+0xf8) search/0x140 .idata
  111. >>>>(&0xe.l+(-4)) string PK\3\4 \b, ZIP self-extracting archive (Info-Zip)
  112. >>>>(&0xe.l+(-4)) string ZZ0 \b, ZZip self-extracting archive
  113. >>>>(&0xe.l+(-4)) string ZZ1 \b, ZZip self-extracting archive
  114. >>>(0x3c.l+0xf8) search/0x140 .rsrc
  115. >>>>(&0x0f.l+(-4)) string a\\\4\5 \b, WinHKI self-extracting archive
  116. >>>>(&0x0f.l+(-4)) string Rar! \b, RAR self-extracting archive
  117. >>>>(&0x0f.l+(-4)) search/0x3000 MSCF \b, InstallShield self-extracting archive
  118. >>>>(&0x0f.l+(-4)) search/32 Nullsoft \b, Nullsoft Installer self-extracting archive
  119. >>>(0x3c.l+0xf8) search/0x140 .data
  120. >>>>(&0x0f.l) string WEXTRACT \b, MS CAB-Installer self-extracting archive
  121. >>>(0x3c.l+0xf8) search/0x140 .petite\0 \b, Petite compressed
  122. >>>>(0x3c.l+0xf7) byte x
  123. >>>>>(&0x104.l+(-4)) string =!sfx! \b, ACE self-extracting archive
  124. >>>(0x3c.l+0xf8) search/0x140 .WISE \b, WISE installer self-extracting archive
  125. >>>(0x3c.l+0xf8) search/0x140 .dz\0\0\0 \b, Dzip self-extracting archive
  126. >>>&(0x3c.l+0xf8) search/0x100 _winzip_ \b, ZIP self-extracting archive (WinZip)
  127. >>>&(0x3c.l+0xf8) search/0x100 SharedD \b, Microsoft Installer self-extracting archive
  128. >>>0x30 string Inno \b, InnoSetup self-extracting archive
  129. # Hmm, not a PE but the relocation table is too high for a traditional DOS exe,
  130. # must be one of the unusual subformats.
  131. >>(0x3c.l) string !PE\0\0 MS-DOS executable
  132. !:mime application/x-dosexec
  133. >>(0x3c.l) string NE \b, NE
  134. !:mime application/x-dosexec
  135. >>>(0x3c.l+0x36) byte 1 for OS/2 1.x
  136. >>>(0x3c.l+0x36) byte 2 for MS Windows 3.x
  137. >>>(0x3c.l+0x36) byte 3 for MS-DOS
  138. >>>(0x3c.l+0x36) byte 4 for Windows 386
  139. >>>(0x3c.l+0x36) byte 5 for Borland Operating System Services
  140. # 0x81 has to be tested before the default, otherwise Phar Lap files are
  140. # first reported as "(unknown OS 81)" and then as Phar Lap
  140. >>>(0x3c.l+0x36) byte 0x81 for MS-DOS, Phar Lap DOS extender
  141. >>>(0x3c.l+0x36) default x
  142. >>>>(0x3c.l+0x36) byte x (unknown OS %x)
  143. >>>(0x3c.l+0x0c) leshort&0x8003 0x8002 (DLL)
  144. >>>(0x3c.l+0x0c) leshort&0x8003 0x8001 (driver)
  145. >>>&(&0x24.s-1) string ARJSFX \b, ARJ self-extracting archive
  146. >>>(0x3c.l+0x70) search/0x80 WinZip(R)\ Self-Extractor \b, ZIP self-extracting archive (WinZip)
  147. >>(0x3c.l) string LX\0\0 \b, LX
  148. !:mime application/x-dosexec
  149. >>>(0x3c.l+0x0a) leshort <1 (unknown OS)
  150. >>>(0x3c.l+0x0a) leshort 1 for OS/2
  151. >>>(0x3c.l+0x0a) leshort 2 for MS Windows
  152. >>>(0x3c.l+0x0a) leshort 3 for DOS
  153. >>>(0x3c.l+0x0a) leshort >3 (unknown OS)
  154. >>>(0x3c.l+0x10) lelong&0x28000 =0x8000 (DLL)
  155. >>>(0x3c.l+0x10) lelong&0x20000 >0 (device driver)
  156. >>>(0x3c.l+0x10) lelong&0x300 0x300 (GUI)
  157. >>>(0x3c.l+0x10) lelong&0x28300 <0x300 (console)
  158. >>>(0x3c.l+0x08) leshort 1 i80286
  159. >>>(0x3c.l+0x08) leshort 2 i80386
  160. >>>(0x3c.l+0x08) leshort 3 i80486
  161. >>>(8.s*16) string emx \b, emx
  162. >>>>&1 string x %s
  163. >>>&(&0x54.l-3) string arjsfx \b, ARJ self-extracting archive
  164. # MS Windows system file, supposedly a collection of LE executables
  165. >>(0x3c.l) string W3 \b, W3 for MS Windows
  166. !:mime application/x-dosexec
  167. >>(0x3c.l) string LE\0\0 \b, LE executable
  168. !:mime application/x-dosexec
  169. >>>(0x3c.l+0x0a) leshort 1
  170. # some DOS extenders use LE files with OS/2 header
  171. >>>>0x240 search/0x100 DOS/4G for MS-DOS, DOS4GW DOS extender
  172. >>>>0x240 search/0x200 WATCOM\ C/C++ for MS-DOS, DOS4GW DOS extender
  173. >>>>0x440 search/0x100 CauseWay\ DOS\ Extender for MS-DOS, CauseWay DOS extender
  174. >>>>0x40 search/0x40 PMODE/W for MS-DOS, PMODE/W DOS extender
  175. >>>>0x40 search/0x40 STUB/32A for MS-DOS, DOS/32A DOS extender (stub)
  176. >>>>0x40 search/0x80 STUB/32C for MS-DOS, DOS/32A DOS extender (configurable stub)
  177. >>>>0x40 search/0x80 DOS/32A for MS-DOS, DOS/32A DOS extender (embedded)
  178. # this is a wild guess; hopefully it is a specific signature
  179. >>>>&0x24 lelong <0x50
  180. >>>>>(&0x4c.l) string \xfc\xb8WATCOM
  181. >>>>>>&0 search/8 3\xdbf\xb9 \b, 32Lite compressed
  182. # another wild guess: if real OS/2 LE executables exist, they probably have higher start EIP
  183. #>>>>(0x3c.l+0x1c) lelong >0x10000 for OS/2
  184. # fails with DOS-Extenders.
  185. >>>(0x3c.l+0x0a) leshort 2 for MS Windows
  186. >>>(0x3c.l+0x0a) leshort 3 for DOS
  187. >>>(0x3c.l+0x0a) leshort 4 for MS Windows (VxD)
  188. >>>(&0x7c.l+0x26) string UPX \b, UPX compressed
  189. >>>&(&0x54.l-3) string UNACE \b, ACE self-extracting archive
  190. # looks like ASCII, probably some embedded copyright message.
  191. # and definitely not NE/LE/LX/PE
  192. >>0x3c lelong >0x20000000
  193. >>>(4.s*512) leshort !0x014c \b, MZ for MS-DOS
  194. !:mime application/x-dosexec
  195. # header data too small for extended executable
  196. >2 long !0
  197. >>0x18 leshort <0x40
  198. >>>(4.s*512) leshort !0x014c
  199. >>>>&(2.s-514) string !LE
  200. >>>>>&-2 string !BW \b, MZ for MS-DOS
  201. !:mime application/x-dosexec
  202. >>>>&(2.s-514) string LE \b, LE
  203. >>>>>0x240 search/0x100 DOS/4G for MS-DOS, DOS4GW DOS extender
  204. # educated guess since indirection is still not capable enough for complex offset
  205. # calculations (next embedded executable would be at &(&2*512+&0-2)
  206. # I suspect there are only LE executables in these multi-exe files
  207. >>>>&(2.s-514) string BW
  208. >>>>>0x240 search/0x100 DOS/4G \b, LE for MS-DOS, DOS4GW DOS extender (embedded)
  209. >>>>>0x240 search/0x100 !DOS/4G \b, BW collection for MS-DOS
  210. # This sequence skips to the first COFF segment, usually .text
  211. >(4.s*512) leshort 0x014c \b, COFF
  212. !:mime application/x-dosexec
  213. >>(8.s*16) string go32stub for MS-DOS, DJGPP go32 DOS extender
  214. >>(8.s*16) string emx
  215. >>>&1 string x for DOS, Win or OS/2, emx %s
  216. >>&(&0x42.l-3) byte x
  217. >>>&0x26 string UPX \b, UPX compressed
  218. # and yet another guess: a small .text followed by a large .data is unusual, could be 32lite
  219. >>&0x2c search/0xa0 .text
  220. >>>&0x0b lelong <0x2000
  221. >>>>&0 lelong >0x6000 \b, 32lite compressed
  222. >(8.s*16) string $WdX \b, WDos/X DOS extender
  223. # By now an executable type should have been printed out. The executable
  224. # may be a self-uncompressing archive, so look for evidence of that and
  225. # print it out.
  226. #
  227. # Some signatures below from Greg Roelofs, newt@uchicago.edu.
  228. #
  229. >0x35 string \x8e\xc0\xb9\x08\x00\xf3\xa5\x4a\x75\xeb\x8e\xc3\x8e\xd8\x33\xff\xbe\x30\x00\x05 \b, aPack compressed
  230. >0xe7 string LH/2\ Self-Extract \b, %s
  231. >0x1c string UC2X \b, UCEXE compressed
  232. >0x1c string WWP\ \b, WWPACK compressed
  233. >0x1c string RJSX \b, ARJ self-extracting archive
  234. >0x1c string diet \b, diet compressed
  235. >0x1c string LZ09 \b, LZEXE v0.90 compressed
  236. >0x1c string LZ91 \b, LZEXE v0.91 compressed
  237. >0x1c string tz \b, TinyProg compressed
  238. >0x1e string Copyright\ 1989-1990\ PKWARE\ Inc. Self-extracting PKZIP archive
  239. !:mime application/zip
  240. # Yes, this really is "Copr", not "Corp."
  241. >0x1e string PKLITE\ Copr. Self-extracting PKZIP archive
  242. !:mime application/zip
  243. # winarj stores a message in the stub instead of the sig in the MZ header
  244. >0x20 search/0xe0 aRJsfX \b, ARJ self-extracting archive
  245. >0x20 string AIN
  246. >>0x23 string 2 \b, AIN 2.x compressed
  247. >>0x23 string <2 \b, AIN 1.x compressed
  248. >>0x23 string >2 \b, AIN 1.x compressed
  249. >0x24 string LHa's\ SFX \b, LHa self-extracting archive
  250. !:mime application/x-lha
  251. >0x24 string LHA's\ SFX \b, LHa self-extracting archive
  252. !:mime application/x-lha
  253. >0x24 string \ $ARX \b, ARX self-extracting archive
  254. >0x24 string \ $LHarc \b, LHarc self-extracting archive
  255. >0x20 string SFX\ by\ LARC \b, LARC self-extracting archive
  256. >0x40 string aPKG \b, aPackage self-extracting archive
  257. >0x64 string W\ Collis\0\0 \b, Compack compressed
  258. >0x7a string Windows\ self-extracting\ ZIP \b, ZIP self-extracting archive
  259. >>&0xf4 search/0x140 \x0\x40\x1\x0
  260. >>>(&0.l+(4)) string MSCF \b, WinHKI CAB self-extracting archive
  261. >1638 string -lh5- \b, LHa self-extracting archive v2.13S
  262. >0x17888 string Rar! \b, RAR self-extracting archive
  263. # Skip to the end of the EXE. This will usually work fine in the PE case
  264. # because the MZ image is hardcoded into the toolchain and almost certainly
  265. # won't match any of these signatures.
  266. >(4.s*512) long x
  267. >>&(2.s-517) byte x
  268. >>>&0 string PK\3\4 \b, ZIP self-extracting archive
  269. >>>&0 string Rar! \b, RAR self-extracting archive
  270. >>>&0 string =!\x11 \b, AIN 2.x self-extracting archive
  271. >>>&0 string =!\x12 \b, AIN 2.x self-extracting archive
  272. >>>&0 string =!\x17 \b, AIN 1.x self-extracting archive
  273. >>>&0 string =!\x18 \b, AIN 1.x self-extracting archive
  274. >>>&7 search/400 **ACE** \b, ACE self-extracting archive
  275. >>>&0 search/0x480 UC2SFX\ Header \b, UC2 self-extracting archive
  276. # a few unknown ZIP sfxes, no idea if they are needed or if they are
  277. # already captured by the generic patterns above
  278. >(8.s*16) search/0x20 PKSFX \b, ZIP self-extracting archive (PKZIP)
  279. # TODO: how to add this? >FileSize-34 string Windows\ Self-Installing\ Executable \b, ZIP self-extracting archive
  280. #
  281. # TELVOX Teleinformatica CODEC self-extractor for OS/2:
  282. >49801 string \x79\xff\x80\xff\x76\xff \b, CODEC archive v3.21
  283. >>49824 leshort =1 \b, 1 file
  284. >>49824 leshort >1 \b, %u files
  285. # added by Joerg Jenderek of http://www.freedos.org/software/?prog=kc
  286. # and http://www.freedos.org/software/?prog=kpdos
  287. # for FreeDOS files like KEYBOARD.SYS, KEYBRD2.SYS, KEYBRD3.SYS, *.KBD
  288. 0 string/b KCF FreeDOS KEYBoard Layout collection
  289. # only version=0x100 found
  290. >3 uleshort x \b, version 0x%x
  291. # length of string containing author,info and special characters
  292. >6 ubyte >0
  293. #>>6 pstring x \b, name=%s
  294. >>7 string >\0 \b, author=%-.14s
  295. >>7 search/254 \xff \b, info=
  296. #>>>&0 string x \b%-s
  297. >>>&0 string x \b%-.15s
  298. # for FreeDOS *.KL files
  299. 0 string/b KLF FreeDOS KEYBoard Layout file
  300. # only version=0x100 or 0x101 found
  301. >3 uleshort x \b, version 0x%x
  302. # stringlength
  303. >5 ubyte >0
  304. >>8 string x \b, name=%-.2s
  305. 0 string \xffKEYB\ \ \ \0\0\0\0
  306. >12 string \0\0\0\0`\004\360 MS-DOS KEYBoard Layout file
  307. # DOS device driver updated by Joerg Jenderek at May 2011,Mar 2017
  308. # https://amaus.net/static/S100/IBM/software/DOS/DOS%20techref/CHAPTER.009
  309. 0 ulequad&0x07a0ffffffff 0xffffffff
  310. >0 use msdos-driver
  311. 0 name msdos-driver DOS executable (
  312. #!:mime application/octet-stream
  313. !:mime application/x-dosdriver
  314. # also found FreeDOS print driver SPOOL.DEV and disc compression driver STACLOAD.BIN
  315. !:ext sys/dev/bin
  316. >40 search/7 UPX! \bUPX compressed
  317. # DOS device driver attributes
  318. >4 uleshort&0x8000 0x0000 \bblock device driver
  319. # character device
  320. >4 uleshort&0x8000 0x8000 \b
  321. >>4 uleshort&0x0008 0x0008 \bclock
  322. # fast video output by int 29h
  323. >>4 uleshort&0x0010 0x0010 \bfast
  324. # standard input/output device
  325. >>4 uleshort&0x0003 >0 \bstandard
  326. >>>4 uleshort&0x0001 0x0001 \binput
  327. >>>4 uleshort&0x0003 0x0003 \b/
  328. >>>4 uleshort&0x0002 0x0002 \boutput
  329. >>4 uleshort&0x8000 0x8000 \bcharacter device driver
  330. >0 ubyte x
  331. # a UPX compressed device driver has garbage instead of the real name in the name field of the header
  332. >>40 search/7 UPX!
  333. >>40 default x
  334. # leading/trailing nulls, zeros or non ASCII characters in 8-byte name field at offset 10 are skipped
  335. >>>12 ubyte >0x2E \b
  336. >>>>10 ubyte >0x20
  337. >>>>>10 ubyte !0x2E
  338. >>>>>>10 ubyte !0x2A \b%c
  339. >>>>11 ubyte >0x20
  340. >>>>>11 ubyte !0x2E \b%c
  341. >>>>12 ubyte >0x20
  342. >>>>>12 ubyte !0x39
  343. >>>>>>12 ubyte !0x2E \b%c
  344. >>>13 ubyte >0x20
  345. >>>>13 ubyte !0x2E \b%c
  346. >>>>14 ubyte >0x20
  347. >>>>>14 ubyte !0x2E \b%c
  348. >>>>15 ubyte >0x20
  349. >>>>>15 ubyte !0x2E \b%c
  350. >>>>16 ubyte >0x20
  351. >>>>>16 ubyte !0x2E
  352. >>>>>>16 ubyte <0xCB \b%c
  353. >>>>17 ubyte >0x20
  354. >>>>>17 ubyte !0x2E
  355. >>>>>>17 ubyte <0x90 \b%c
  356. # some character device drivers like ASPICD.SYS, btcdrom.sys and Cr_atapi.sys contain only spaces or dots in the name field
  357. >>>12 ubyte <0x2F
  358. # they have their real name at offset 22
  359. # also block device drivers like DUMBDRV.SYS
  360. >>>>22 string >\056 %-.6s
  361. >4 uleshort&0x8000 0x0000
  362. # 32 bit sector addressing ( > 32 MB) for block devices
  363. >>4 uleshort&0x0002 0x0002 \b,32-bit sector-
  364. # support by driver functions 13h, 17h, 18h
  365. >4 uleshort&0x0040 0x0040 \b,IOCTL-
  366. # open, close, removable media support by driver functions 0Dh, 0Eh, 0Fh
  367. >4 uleshort&0x0800 0x0800 \b,close media-
  368. # output until busy support by int 10h for character device driver
  369. >4 uleshort&0x8000 0x8000
  370. >>4 uleshort&0x2000 0x2000 \b,until busy-
  371. # direct read/write support by driver functions 03h,0Ch
  372. >4 uleshort&0x4000 0x4000 \b,control strings-
  373. >4 uleshort&0x8000 0x8000
  374. >>4 uleshort&0x6840 >0 \bsupport
  375. >4 uleshort&0x8000 0x0000
  376. >>4 uleshort&0x4842 >0 \bsupport
  377. >0 ubyte x \b)
  378. # DOS driver cmd640x.sys has 0x12 instead of 0xffffffff for pointer field to next device header
  379. 0 ulequad 0x0513c00000000012
  380. >0 use msdos-driver
  381. # DOS drivers DC2975.SYS, DUMBDRV.SYS, ECHO.SYS also have a value other than 0xffffffff in the pointer field
  382. 0 ulequad 0x32f28000ffff0016
  383. >0 use msdos-driver
  384. 0 ulequad 0x007f00000000ffff
  385. >0 use msdos-driver
  386. 0 ulequad 0x001600000000ffff
  387. >0 use msdos-driver
  388. # DOS drivers LS120.SYS, MKELS120.SYS use reserved bits of attribute field
  389. 0 ulequad 0x0bf708c2ffffffff
  390. >0 use msdos-driver
  391. 0 ulequad 0x07bd08c2ffffffff
  392. >0 use msdos-driver
  393. # updated by Joerg Jenderek
  394. # GRR: line below too general as it catches also
  395. # rt.lib DYADISKS.PIC and many more
  396. # start with assembler instruction MOV
  397. 0 ubyte 0x8c
  398. # skip "AppleWorks word processor data" like ARTICLE.1 ./apple
  399. >4 string !O====
  400. # skip some unknown basic binaries like RocketRnger.SHR
  401. >>5 string !MAIN
  402. # skip "GPG symmetrically encrypted data" ./gnu
  403. # skip "PGP symmetric key encrypted data" ./pgp
  404. # openpgpdefs.h: fourth byte < 14 indicates cipher algorithm type
  405. >>>4 ubyte >13 DOS executable (COM, 0x8C-variant)
  406. # the remaining files should be DOS *.COM executables
  407. # dosshell.COM 8cc0 2ea35f07 e85211 e88a11 b80058 cd
  408. # hmload.COM 8cc8 8ec0 bbc02b 89dc 83c30f c1eb04 b4
  409. # UNDELETE.COM 8cca 2e8916 6503 b430 cd21 8b 2e0200 8b
  410. # BOOTFIX.COM 8cca 2e8916 9603 b430 cd21 8b 2e0200 8b
  411. # RAWRITE3.COM 8cca 2e8916 d602 b430 cd21 8b 2e0200 8b
  412. # SHARE.COM 8cca 2e8916 d602 b430 cd21 8b 2e0200 8b
  413. # validchr.COM 8cca 2e8916 9603 b430 cd21 8b 2e028b1e
  414. # devload.COM 8cca 8916ad01 b430 cd21 8b2e0200 892e
  415. !:mime application/x-dosexec
  416. !:ext com
  417. # updated by Joerg Jenderek at Oct 2008
  418. 0 ulelong 0xffff10eb DR-DOS executable (COM)
  419. # byte 0xeb conflicts with "sequent" magic leshort 0xn2eb
  420. 0 ubeshort&0xeb8d >0xeb00
  421. # DR-DOS STACKER.COM SCREATE.SYS missed
  422. 0 name msdos-com
  423. >0 byte x DOS executable (COM)
  424. >6 string SFX\ of\ LHarc \b, %s
  425. >0x1FE leshort 0xAA55 \b, boot code
  426. >85 string UPX \b, UPX compressed
  427. >4 string \ $ARX \b, ARX self-extracting archive
  428. >4 string \ $LHarc \b, LHarc self-extracting archive
  429. >0x20e string SFX\ by\ LARC \b, LARC self-extracting archive
  430. # JMP 8bit
  431. 0 byte 0xeb
  432. # allow forward jumps only
  433. >1 byte >-1
  434. # that offset must be accessible
  435. >>(1.b+2) byte x
  436. >>>0 use msdos-com
  437. # JMP 16bit
  438. 0 byte 0xe9
  439. # forward jumps only; leshort because the displacement is little-endian (as the .s indirection below reads it), plain short is host byte order
  440. >1 leshort >-1
  441. # that offset must be accessible
  442. >>(1.s+3) byte x
  443. >>>0 use msdos-com
  444. # negative offset, must not lead into PSP (little-endian displacement again)
  445. >1 leshort <-259
  446. # that offset must be accessible
  447. >>(1,s+65539) byte x
  448. >>>0 use msdos-com
  449. # updated by Joerg Jenderek at Oct 2008,2015
  450. # following line is too general
  451. 0 ubyte 0xb8
  452. # skip 2 linux kernels like memtest.bin with "\xb8\xc0\x07\x8e" in ./linux
  453. >0 string !\xb8\xc0\x07\x8e
  454. # modified by Joerg Jenderek
  455. # syslinux COM32 or COM32R executable
  456. >>1 lelong&0xFFFFFFFe 0x21CD4CFe COM executable (32-bit COMBOOT
  457. # http://www.syslinux.org/wiki/index.php/Comboot_API
  458. # Since version 5.00 c32 modules switched from the COM32 object format to ELF
  459. !:mime application/x-c32-comboot-syslinux-exec
  460. !:ext c32
  461. # http://syslinux.zytor.com/comboot.php
  462. # older syslinux version ( <4 )
  463. # (32-bit COMBOOT) programs *.C32 contain 32-bit code and run in flat-memory 32-bit protected mode
  464. # start with assembler instructions mov eax,21cd4cffh
  465. >>>1 lelong 0x21CD4CFf \b)
  466. # syslinux:doc/comboot.txt
  467. # A COM32R program must start with the byte sequence B8 FE 4C CD 21 (mov
  468. # eax,21cd4cfeh) as a magic number.
  469. # syslinux version (4.x)
  470. # "COM executable (COM32R)" or "Syslinux COM32 module" by TrID
  471. >>>1 lelong 0x21CD4CFe \b, relocatable)
  472. # remaining are DOS COM executables starting with assembler instruction MOV
  473. # like FreeDOS BANNER*.COM FINDDISK.COM GIF2RAW.COM WINCHK.COM
  474. # MS-DOS SYS.COM RESTART.COM
  475. # SYSLINUX.COM (version 1.40 - 2.13)
  476. # GFXBOOT.COM (version 3.75)
  477. # COPYBS.COM POWEROFF.COM INT18.COM
  478. >>1 default x COM executable for DOS
  479. !:mime application/x-dosexec
  480. #!:mime application/x-ms-dos-executable
  481. #!:mime application/x-msdos-program
  482. !:ext com
  483. 0 string/b \x81\xfc
  484. >4 string \x77\x02\xcd\x20\xb9
  485. >>36 string UPX! FREE-DOS executable (COM), UPX compressed
  486. 252 string Must\ have\ DOS\ version DR-DOS executable (COM)
  487. # added by Joerg Jenderek at Oct 2008
  488. # GRR search is not working
  489. #34 search/2 UPX! FREE-DOS executable (COM), UPX compressed
  490. 34 string UPX! FREE-DOS executable (COM), UPX compressed
  491. 35 string UPX! FREE-DOS executable (COM), UPX compressed
  492. # GRR search is not working
  493. #2 search/28 \xcd\x21 COM executable for MS-DOS
  494. #WHICHFAT.cOM
  495. 2 string \xcd\x21 COM executable for DOS
  496. #DELTREE.cOM DELTREE2.cOM
  497. 4 string \xcd\x21 COM executable for DOS
  498. #IFMEMDSK.cOM ASSIGN.cOM COMP.cOM
  499. 5 string \xcd\x21 COM executable for DOS
  500. #DELTMP.COm HASFAT32.cOM
  501. 7 string \xcd\x21
  502. >0 byte !0xb8 COM executable for DOS
  503. #COMP.cOM MORE.COm
  504. 10 string \xcd\x21
  505. >5 string !\xcd\x21 COM executable for DOS
  506. #comecho.com
  507. 13 string \xcd\x21 COM executable for DOS
  508. #HELP.COm EDIT.coM
  509. 18 string \xcd\x21 COM executable for MS-DOS
  510. #NWRPLTRM.COm
  511. 23 string \xcd\x21 COM executable for MS-DOS
  512. #LOADFIX.cOm LOADFIX.cOm
  513. 30 string \xcd\x21 COM executable for MS-DOS
  514. #syslinux.com 3.11
  515. 70 string \xcd\x21 COM executable for DOS
  516. # many compressed/converted COMs start with a copy loop instead of a jump
  517. 0x6 search/0xa \xfc\x57\xf3\xa5\xc3 COM executable for MS-DOS
  518. 0x6 search/0xa \xfc\x57\xf3\xa4\xc3 COM executable for DOS
  519. >0x18 search/0x10 \x50\xa4\xff\xd5\x73 \b, aPack compressed
  520. 0x3c string W\ Collis\0\0 COM executable for MS-DOS, Compack compressed
  521. # FIXME: missing diet .com compression
  522. # miscellaneous formats
  523. 0 string/b LZ MS-DOS executable (built-in)
  524. #0 byte 0xf0 MS-DOS program library data
  525. #
  526. # AAF files:
  527. # <stuartc@rd.bbc.co.uk> Stuart Cunningham
  528. 0 string/b \320\317\021\340\241\261\032\341AAFB\015\000OM\006\016\053\064\001\001\001\377 AAF legacy file using MS Structured Storage
  529. >30 byte 9 (512B sectors)
  530. >30 byte 12 (4kB sectors)
  531. 0 string/b \320\317\021\340\241\261\032\341\001\002\001\015\000\002\000\000\006\016\053\064\003\002\001\001 AAF file using MS Structured Storage
  532. >30 byte 9 (512B sectors)
  533. >30 byte 12 (4kB sectors)
  534. # Popular applications
  535. 2080 string Microsoft\ Word\ 6.0\ Document %s
  536. !:mime application/msword
  537. 2080 string Documento\ Microsoft\ Word\ 6 Spanish Microsoft Word 6 document data
  538. !:mime application/msword
  539. # Pawel Wiecek <coven@i17linuxb.ists.pwr.wroc.pl> (for polish Word)
  540. 2112 string MSWordDoc Microsoft Word document data
  541. !:mime application/msword
  542. #
  543. 0 belong 0x31be0000 Microsoft Word Document
  544. !:mime application/msword
  545. #
  546. 0 string/b PO^Q` Microsoft Word 6.0 Document
  547. !:mime application/msword
  548. #
  549. 4 long 0
  550. >0 belong 0xfe320000 Microsoft Word for Macintosh 1.0
  551. !:mime application/msword
  552. !:ext mcw
  553. >0 belong 0xfe340000 Microsoft Word for Macintosh 3.0
  554. !:mime application/msword
  555. !:ext mcw
  556. >0 belong 0xfe37001c Microsoft Word for Macintosh 4.0
  557. !:mime application/msword
  558. !:ext mcw
  559. >0 belong 0xfe370023 Microsoft Word for Macintosh 5.0
  560. !:mime application/msword
  561. !:ext mcw
  562. 0 string/b \333\245-\0\0\0 Microsoft Word 2.0 Document
  563. !:mime application/msword
  564. !:ext doc
  565. 512 string/b \354\245\301 Microsoft Word Document
  566. !:mime application/msword
  567. #
  568. 0 string/b \xDB\xA5\x2D\x00 Microsoft WinWord 2.0 Document
  569. !:mime application/msword
  570. #
  571. 2080 string Microsoft\ Excel\ 5.0\ Worksheet %s
  572. !:mime application/vnd.ms-excel
  573. #
  574. # (an exact duplicate of the "Microsoft WinWord 2.0 Document" test that precedes
  575. # the Excel 5.0 worksheet test used to be repeated here; it has been dropped)
  576. 2080 string Foglio\ di\ lavoro\ Microsoft\ Exce %s
  577. !:mime application/vnd.ms-excel
  578. #
  579. # Pawel Wiecek <coven@i17linuxb.ists.pwr.wroc.pl> (for polish Excel)
  580. 2114 string Biff5 Microsoft Excel 5.0 Worksheet
  581. !:mime application/vnd.ms-excel
  582. # Italian MS-Excel
  583. 2121 string Biff5 Microsoft Excel 5.0 Worksheet
  584. !:mime application/vnd.ms-excel
  585. 0 string/b \x09\x04\x06\x00\x00\x00\x10\x00 Microsoft Excel Worksheet
  586. !:mime application/vnd.ms-excel
  587. #
  588. # Update: Joerg Jenderek
  589. # URL: https://en.wikipedia.org/wiki/Lotus_1-2-3
  590. # Reference: http://www.aboutvb.de/bas/formate/pdf/wk3.pdf
  591. # Note: newer Lotus versions >2 use longer BOF record
  592. # record type (BeginningOfFile=0000h) + length (001Ah)
  593. 0 belong 0x00001a00
  594. # reserved should be 0h but 8c0dh for TUTMAC.WK3, 5h for SAMPADNS.WK3, 1h for a_readme.wk3, 1eh for K&G86.WK3
  595. #>18 uleshort&0x73E0 0
  596. # Lotus Multi Byte Character Set (LMBCS=1-31)
  597. >20 ubyte >0
  598. >>20 ubyte <32 Lotus 1-2-3
  599. #!:mime application/x-123
  600. !:mime application/vnd.lotus-1-2-3
  601. !:apple ????L123
  602. # (version 5.26) labeled the entry as "Lotus 1-2-3 wk3 document data"
  603. >>>4 uleshort 0x1000 WorKsheet, version 3
  604. !:ext wk3
  605. # (version 5.26) labeled the entry as "Lotus 1-2-3 wk4 document data"
  606. >>>4 uleshort 0x1002 WorKsheet, version 4
  607. # also worksheet template 4 (.wt4)
  608. !:ext wk4/wt4
  609. # no example or documentation for wk5
  610. #>>>4 uleshort 0x???? WorKsheet, version 5
  611. #!:ext wk5
  612. # only MacrotoScript.123 example
  613. >>>4 uleshort 0x1003 WorKsheet, version 97
  614. # also worksheet template Smartmaster (.12M)?
  615. !:ext 123
  616. # only Set_Y2K.123 example
  617. >>>4 uleshort 0x1005 WorKsheet, version 9.8 Millennium
  618. !:ext 123
  619. # no example for this version
  620. >>>4 uleshort 0x8001 FoRMatting data
  621. !:ext frm
  622. # (version 5.26) labeled the entry as "Lotus 1-2-3 fm3 or fmb document data"
  623. # TrID labels the entry as "Formatting Data for Lotus 1-2-3 worksheet"
  624. >>>4 uleshort 0x8007 ForMatting data, version 3
  625. !:ext fm3
  626. >>>4 default x unknown
  627. # file revision sub code 0004h for worksheets
  628. >>>>6 uleshort =0x0004 worksheet
  629. !:ext wXX
  630. >>>>6 uleshort !0x0004 formatting data
  631. !:ext fXX
  632. # main revision number
  633. >>>>4 uleshort x \b, revision 0x%x
  634. >>>6 uleshort =0x0004 \b, cell range
  635. # active cellcoord range (start row, page,column ; end row, page, column)
  636. # start values normally 0~1st sheet A1
  637. >>>>8 ulelong !0
  638. >>>>>10 ubyte >0 \b%d*
  639. >>>>>8 uleshort x \b%d,
  640. >>>>>11 ubyte x \b%d-
  641. # end page mostly 0
  642. >>>>14 ubyte >0 \b%d*
  643. # end row, column normally not 0
  644. >>>>12 uleshort x \b%d,
  645. >>>>15 ubyte x \b%d
  646. # Lotus Multi Byte Character Set (1~cp850,2~cp851,...,16~japan,...,31~??)
  647. >>>>20 ubyte >1 \b, character set 0x%x
  648. # flags
  649. >>>>21 ubyte x \b, flags 0x%x
  650. >>>6 uleshort !0x0004
  651. # record type (FONTNAME=00AEh)
  652. >>>>30 search/29 \0\xAE
  653. # variable length m (2) + entries (1) + ?? (1) + LMBCS string (n)
  654. >>>>>&4 string >\0 \b, 1st font "%s"
  655. #
  656. # Update: Joerg Jenderek
  657. # URL: http://fileformats.archiveteam.org/wiki/Lotus_1-2-3
  658. # Reference: http://www.schnarff.com/file-formats/lotus-1-2-3/WSFF2.TXT
  659. # Note: Used by both old Lotus 1-2-3 and Lotus Symphony (DOS) til version 2.x
  660. # record type (BeginningOfFile=0000h) + length (0002h)
  661. 0 belong 0x00000200
  662. # GRR: line above is too general as it catches also MS Windows CURsor
  663. # to display MS Windows cursor (strength=70) before Lotus 1-2-3 (strength=70-1)
  664. !:strength -1
  665. # skip Windows cursors with image height <256 and keep Lotus with low opcode 0001-0083h
  666. >7 ubyte 0
  667. # skip Windows cursors with image width 256 and keep Lotus with positive opcode
  668. >>6 ubyte >0 Lotus
  669. # !:mime application/x-123
  670. !:mime application/vnd.lotus-1-2-3
  671. !:apple ????L123
  672. # revision number (0404h = 123 1A, 0405h = Lotus Symphony , 0406h = 123 2.x wk1 , 8006h = fmt , ...)
  673. # undocumented; (version 5.26) labeled the configurations as "Lotus 1-2-3"
  674. >>>4 uleshort 0x0007 1-2-3 CoNFiguration, version 2.x (PGRAPH.CNF)
  675. !:ext cnf
  676. >>>4 uleshort 0x0C05 1-2-3 CoNFiguration, version 2.4J
  677. !:ext cnf
  678. >>>4 uleshort 0x0801 1-2-3 CoNFiguration, version 1-2.1
  679. !:ext cnf
  680. >>>4 uleshort 0x0802 Symphony CoNFiguration
  681. !:ext cnf
  682. >>>4 uleshort 0x0804 1-2-3 CoNFiguration, version 2.2
  683. !:ext cnf
  684. >>>4 uleshort 0x080A 1-2-3 CoNFiguration, version 2.3-2.4
  685. !:ext cnf
  686. >>>4 uleshort 0x1402 1-2-3 CoNFiguration, version 3.x
  687. !:ext cnf
  688. >>>4 uleshort 0x1450 1-2-3 CoNFiguration, version 4.x
  689. !:ext cnf
  690. # (version 5.26) labeled the entry as "Lotus 123"
  691. # TrID labels the entry as "Lotus 123 Worksheet (generic)"
  692. >>>4 uleshort 0x0404 1-2-3 WorKSheet, version 1
  693. # extension "wks" also for Microsoft Works document
  694. !:ext wks
  695. # (version 5.26) labeled the entry as "Lotus 123"
  696. # TrID labels the entry as "Lotus 123 Worksheet (generic)"
  697. >>>4 uleshort 0x0405 Symphony WoRksheet, version 1.0
  698. !:ext wrk/wr1
  699. # (version 5.26) labeled the entry as "Lotus 1-2-3 wk1 document data"
  700. # TrID labels the entry as "Lotus 123 Worksheet (V2)"
  701. >>>4 uleshort 0x0406 1-2-3/Symphony worksheet, version 2
  702. # Symphony (.wr1)
  703. !:ext wk1/wr1
  704. # no example for this japan version
  705. >>>4 uleshort 0x0600 1-2-3 WorKsheet, version 1.xJ
  706. !:ext wj1
  707. # no example or documentation for wk2
  708. #>>>4 uleshort 0x???? 1-2-3 WorKsheet, version 2
  709. #!:ext wk2
  710. # undocumented japan version
  711. >>>4 uleshort 0x0602 1-2-3 worksheet, version 2.4J
  712. !:ext wj3
  713. # (version 5.26) labeled the entry as "Lotus 1-2-3 fmt document data"
  714. >>>4 uleshort 0x8006 1-2-3 ForMaTting data, version 2.x
  715. # japan version 2.4J (fj3)
  716. !:ext fmt/fj3
  717. # no example for this version
  718. >>>4 uleshort 0x8007 1-2-3 FoRMatting data, version 2.0
  719. !:ext frm
  720. # (version 5.26) labeled the entry as "Lotus 1-2-3"
  721. >>>4 default x unknown worksheet or configuration
  722. !:ext cnf
  723. >>>>4 uleshort x \b, revision 0x%x
  724. # 2nd record for most worksheets describes cells range
  725. >>>6 use lotus-cells
  726. # 3rd record for most japan worksheets describes cells range
  727. >>>(8.s+10) use lotus-cells
  728. # subroutine lotus-cells: if a RANGE record starts at the given offset, display the Lotus worksheet cell range
  729. 0 name lotus-cells
  730. # look for type (RANGE=0006h) + length (0008h) at record begin; both are little-endian words (bytes 06 00 08 00)
  731. >0 ubelong 0x06000800 \b, cell range
  732. # cell range (start column, row, end column, row); start is only displayed when not 0,0 (~A1 cell)
  733. >>4 ulong !0
  734. >>>4 uleshort x \b%d,
  735. >>>6 uleshort x \b%d-
  736. # end of cell range (column, row) is always displayed
  737. >>8 uleshort x \b%d,
  738. >>10 uleshort x \b%d
  739. # EndOfLotus123
  740. 0 string/b WordPro\0 Lotus WordPro
  741. !:mime application/vnd.lotus-wordpro
  742. 0 string/b WordPro\r\373 Lotus WordPro
  743. !:mime application/vnd.lotus-wordpro
  744. # Summary: Script used by InstallShield to uninstall applications
  745. # Extension: .isu
  746. # Submitted by: unknown
  747. # Modified by (1): Abel Cheung <abelcheung@gmail.com> (replace useless entry)
  748. 0 string \x71\xa8\x00\x00\x01\x02
  749. >12 string Stirling\ Technologies, InstallShield Uninstall Script
  750. # Winamp .avs
  751. #0 string Nullsoft\ AVS\ Preset\ \060\056\061\032 A plug in for Winamp ms-windows Freeware media player
  752. 0 string/b Nullsoft\ AVS\ Preset\ Winamp plug in
  753. # Windows Metafont .WMF
  754. 0 string/b \327\315\306\232 ms-windows metafont .wmf
  755. 0 string/b \002\000\011\000 ms-windows metafont .wmf
  756. 0 string/b \001\000\011\000 ms-windows metafont .wmf
  757. #tz3 files whatever that is (MS Works files)
  758. 0 string/b \003\001\001\004\070\001\000\000 tz3 ms-works file
  759. 0 string/b \003\002\001\004\070\001\000\000 tz3 ms-works file
  760. 0 string/b \003\003\001\004\070\001\000\000 tz3 ms-works file
  761. # PGP sig files .sig
  762. #0 string \211\000\077\003\005\000\063\237\127 065 to \027\266\151\064\005\045\101\233\021\002 PGP sig
  763. 0 string \211\000\077\003\005\000\063\237\127\065\027\266\151\064\005\045\101\233\021\002 PGP sig
  764. 0 string \211\000\077\003\005\000\063\237\127\066\027\266\151\064\005\045\101\233\021\002 PGP sig
  765. 0 string \211\000\077\003\005\000\063\237\127\067\027\266\151\064\005\045\101\233\021\002 PGP sig
  766. 0 string \211\000\077\003\005\000\063\237\127\070\027\266\151\064\005\045\101\233\021\002 PGP sig
  767. 0 string \211\000\077\003\005\000\063\237\127\071\027\266\151\064\005\045\101\233\021\002 PGP sig
  768. 0 string \211\000\225\003\005\000\062\122\207\304\100\345\042 PGP sig
  769. # windows zips files .dmf
  770. 0 string/b MDIF\032\000\010\000\000\000\372\046\100\175\001\000\001\036\001\000 MS Windows special zipped file
  771. #ico files
  772. 0 string/b \102\101\050\000\000\000\056\000\000\000\000\000\000\000 Icon for MS Windows
  773. # Windows icons
  774. # Update: Joerg Jenderek
  775. # URL: https://en.wikipedia.org/wiki/CUR_(file_format)
  776. # Note: similar to Windows CURsor; container for BMP (only DIB part) or PNG. Offset 9 (accepted: 0 or FFh) is byte 3 of the 1st directory entry, which starts at offset 6
  777. 0 belong 0x00000100
  778. >9 byte 0
  779. >>0 byte x
  780. >>0 use cur-ico-dir
  781. >9 ubyte 0xff
  782. >>0 byte x
  783. >>0 use cur-ico-dir
  784. # subroutine cur-ico-dir: displays the number of images and information for the 1st (icons: also the 2nd) directory entry of an icon or cursor
  785. 0 name cur-ico-dir
  786. # skip some Lotus 1-2-3 worksheets, CYCLE.PIC and keep Windows cursors with
  787. # 1st data offset = dir header size + n * dir entry size = 6 + n * 10h = ?6h (test: bits 1 and 2 of the offset are set)
  788. >18 ulelong &0x00000006
  789. # skip remaining worksheets: the 1st data offset must point inside the file. NOTE(review): the DIB (40) / PNG (\x89PNG) value itself is not compared here (test is "x")
  790. >>(18.l) ulelong x MS Windows
  791. >>>0 ubelong 0x00000100 icon resource
  792. #!:mime image/vnd.microsoft.icon
  793. !:mime image/x-icon
  794. !:ext ico
  795. >>>>4 uleshort x - %d icon
  796. # plural s when more than one image
  797. >>>>4 uleshort >1 \bs
  798. # 1st icon entry directly after the 6 byte directory header
  799. >>>>0x06 use ico-entry
  800. # 2nd icon entry (6 + 10h), only when the directory holds more than one image
  801. >>>>4 uleshort >1
  802. >>>>>0x16 use ico-entry
  803. >>>0 ubelong 0x00000200 cursor resource
  804. #!:mime image/x-cur
  805. !:mime image/x-win-bitmap
  806. !:ext cur
  807. >>>>4 uleshort x - %d icon
  808. >>>>4 uleshort >1 \bs
  809. # 1st cursor entry; a 2nd entry is not displayed (line below is disabled)
  810. >>>>0x06 use cur-entry
  811. #>>>>0x16 use cur-entry
  812. # subroutine cur-entry: display one cursor directory entry (shared fields via cur-ico-entry, then the hotspot from the 16-bit values at entry offsets 4 and 6)
  813. 0 name cur-entry
  814. >0 use cur-ico-entry
  815. >4 uleshort x \b, hotspot @%dx
  816. >6 uleshort x \b%d
  817. # subroutine ico-entry: display one icon directory entry (shared fields via cur-ico-entry, then planes and bits/pixel when greater than 1)
  818. 0 name ico-entry
  819. >0 use cur-ico-entry
  820. # planes: normally 0 or 1 (then not displayed) but also found 14
  821. >4 uleshort >1 \b, %d planes
  822. # bits/pixel: normally 0 or 1 (then not displayed) but also found some 3, 4, some 6, 8, 24, many 32, two 256
  823. >6 uleshort >1 \b, %d bits/pixel
  824. # subroutine cur-ico-entry: display information shared by cursor and icon entries: width x height (a stored 0 is displayed as 256), palette size, embedded image
  825. 0 name cur-ico-entry
  826. >0 byte =0 \b, 256x
  827. >0 byte !0 \b, %dx
  828. >1 byte =0 \b256
  829. >1 byte !0 \b%d
  830. # number of colors in palette; displayed only when not 0
  831. >2 ubyte !0 \b, %d colors
  832. # reserved 0 FFh
  833. #>3 ubyte x \b, reserved %x
  834. #>8 ulelong x \b, image size %d
  835. # offset of PNG or DIB image
  836. #>12 ulelong x \b, offset 0x%x
  837. # PNG header (\x89PNG) found at the image offset: step back 4 bytes and let the other magic entries describe the embedded image
  838. >(12.l) ubelong =0x89504e47
  839. >>&-4 indirect x \b with
  840. # DIB image (anything that is not PNG); nothing more is displayed because the line below is disabled
  841. >(12.l) ubelong !0x89504e47
  842. #>>&-4 use dib-image
  843. # Windows non-animated cursors
  844. # Update: Joerg Jenderek
  845. # URL: https://en.wikipedia.org/wiki/CUR_(file_format)
  846. # Note: similar to Windows ICOn; container for BMP (only DIB part). Offset 9 (accepted: 0 or FFh) is byte 3 of the 1st directory entry, which starts at offset 6
  847. # GRR: line below is too general as it catches also Lotus 1-2-3 files
  848. 0 belong 0x00000200
  849. >9 byte 0
  850. >>0 use cur-ico-dir
  851. >9 ubyte 0xff
  852. >>0 use cur-ico-dir
  853. # .chr files
  854. 0 string/b PK\010\010BGI Borland font
  855. >4 string >\0 %s
  856. # then there is a copyright notice
  857. # .bgi files
  858. 0 string/b pk\010\010BGI Borland device
  859. >4 string >\0 %s
  860. # then there is a copyright notice
  861. # Windows Recycle Bin record file (named INFO2)
  862. # By Abel Cheung (abelcheung AT gmail dot com)
  863. # Version 4 always has 280 bytes (0x118) per record, version 5 has 800 bytes
  864. # Since Vista uses another structure, INFO2 structure probably won't change
  865. # anymore. Detailed analysis in:
  866. # http://www.cybersecurityinstitute.biz/downloads/INFO2.pdf
  867. 0 lelong 0x00000004
  868. >12 lelong 0x00000118 Windows Recycle Bin INFO2 file (Win98 or below)
  869. 0 lelong 0x00000005
  870. >12 lelong 0x00000320 Windows Recycle Bin INFO2 file (Win2k - WinXP)
  871. # From Doug Lee via a FreeBSD pr
  872. 9 string GERBILDOC First Choice document
  873. 9 string GERBILDB First Choice database
  874. 9 string GERBILCLIP First Choice database
  875. 0 string GERBIL First Choice device file
  876. 9 string RABBITGRAPH RabbitGraph file
  877. 0 string DCU1 Borland Delphi .DCU file
  878. 0 string =!<spell> MKS Spell hash list (old format)
  879. 0 string =!<spell2> MKS Spell hash list
  880. # Too simple - MPi
  881. #0 string AH Halo(TM) bitmapped font file
  882. 0 lelong 0x08086b70 TurboC BGI file
  883. 0 lelong 0x08084b50 TurboC Font file
  884. # Debian#712046: The magic below identifies "Delphi compiled form data".
  885. # An additional source of information is available at:
  886. # http://www.woodmann.com/fravia/dafix_t1.htm
  887. 0 string TPF0
  888. >4 pstring >\0 Delphi compiled form '%s'
  889. # tests for DBase files moved, updated and merged to database
  890. 0 string PMCC Windows 3.x .GRP file
  891. 1 string RDC-meg MegaDots
  892. >8 byte >0x2F version %c
  893. >9 byte >0x2F \b.%c file
  894. 0 lelong 0x4C
  895. >4 lelong 0x00021401 Windows shortcut file
  896. # .PIF files added by Joerg Jenderek from http://smsoft.ru/en/pifdoc.htm
  897. # only for windows versions equal or greater 3.0
  898. 0x171 string MICROSOFT\ PIFEX\0 Windows Program Information File
  899. !:mime application/x-dosexec
  900. #>2 string >\0 \b, Title:%.30s
  901. >0x24 string >\0 \b for %.63s
  902. >0x65 string >\0 \b, directory=%.64s
  903. >0xA5 string >\0 \b, parameters=%.64s
  904. #>0x181 leshort x \b, offset %x
  905. #>0x183 leshort x \b, offsetdata %x
  906. #>0x185 leshort x \b, section length %x
  907. >0x187 search/0xB55 WINDOWS\ VMM\ 4.0\0
  908. >>&0x5e ubyte >0
  909. >>>&-1 string <PIFMGR.DLL \b, icon=%s
  910. #>>>&-1 string PIFMGR.DLL \b, icon=%s
  911. >>>&-1 string >PIFMGR.DLL \b, icon=%s
  912. >>&0xF0 ubyte >0
  913. >>>&-1 string <Terminal \b, font=%.32s
  914. #>>>&-1 string =Terminal \b, font=%.32s
  915. >>>&-1 string >Terminal \b, font=%.32s
  916. >>&0x110 ubyte >0
  917. >>>&-1 string <Lucida\ Console \b, TrueTypeFont=%.32s
  918. #>>>&-1 string =Lucida\ Console \b, TrueTypeFont=%.32s
  919. >>>&-1 string >Lucida\ Console \b, TrueTypeFont=%.32s
  920. #>0x187 search/0xB55 WINDOWS\ 286\ 3.0\0 \b, Windows 3.X standard mode-style
  921. #>0x187 search/0xB55 WINDOWS\ 386\ 3.0\0 \b, Windows 3.X enhanced mode-style
  922. >0x187 search/0xB55 WINDOWS\ NT\ \ 3.1\0 \b, Windows NT-style
  923. #>0x187 search/0xB55 WINDOWS\ NT\ \ 4.0\0 \b, Windows NT-style
  924. >0x187 search/0xB55 CONFIG\ \ SYS\ 4.0\0 \b +CONFIG.SYS
  925. #>>&06 string x \b:%s
  926. >0x187 search/0xB55 AUTOEXECBAT\ 4.0\0 \b +AUTOEXEC.BAT
  927. #>>&06 string x \b:%s
  928. # DOS EPS Binary File Header: 4 byte signature C5 D0 D3 C6, then offset/length pairs stored as little-endian 32-bit values
  929. # From: Ed Sznyter <ews@Black.Market.NET>
  930. 0 belong 0xC5D0D3C6 DOS EPS Binary File
  931. !:mime image/x-eps
  932. >4 lelong >0 Postscript starts at byte %d
  933. >>8 lelong >0 length %d
  934. >>>12 lelong >0 Metafile starts at byte %d
  935. >>>>16 lelong >0 length %d
  936. >>>20 lelong >0 TIFF starts at byte %d
  937. >>>>24 lelong >0 length %d
  938. # TNEF magic From "Joomy" <joomy@se-ed.net>
  939. # Microsoft Outlook's Transport Neutral Encapsulation Format (TNEF); the signature is the 32-bit little-endian value 0x223e9f78, so it needs a 4 byte type
  940. 0 lelong 0x223e9f78 TNEF
  941. !:mime application/vnd.ms-tnef
  942. # Norton Guide (.NG , .HLP) files added by Joerg Jenderek from source NG2HTML.C
  943. # of http://www.davep.org/norton-guides/ng2h-105.tgz
  944. # http://en.wikipedia.org/wiki/Norton_Guides
  945. 0 string NG\0\001
  946. # only value 0x100 found at offset 2
  947. >2 ulelong 0x00000100 Norton Guide
  948. # Title[40]
  949. >>8 string >\0 "%-.40s"
  950. #>>6 uleshort x \b, MenuCount=%u
  951. # szCredits[5][66]
  952. >>48 string >\0 \b, %-.66s
  953. >>114 string >\0 %-.66s
  954. # 4DOS help (.HLP) files added by Joerg Jenderek from source TPHELP.PAS
  955. # of http://www.4dos.info/
  956. # pointer,HelpID[8]=4DHnnnmm
  957. 0 ulelong 0x48443408 4DOS help file
  958. >4 string x \b, version %-4.4s
  959. # old binary Microsoft (.HLP) files added by Joerg Jenderek from http://file-extension.net/seeker/file_extension_hlp
  960. 0 ulequad 0x3a000000024e4c MS Advisor help file
  961. # HtmlHelp files (.chm)
  962. 0 string/b ITSF\003\000\000\000\x60\000\000\000 MS Windows HtmlHelp Data
  963. # GFA-BASIC (Wolfram Kleff)
  964. 2 string/b GFA-BASIC3 GFA-BASIC 3 data
  965. #------------------------------------------------------------------------------
  966. # From Stuart Caie <kyzer@4u.net> (developer of cabextract)
  967. # Microsoft Cabinet files
  968. 0 string/b MSCF\0\0\0\0 Microsoft Cabinet archive data
  969. !:mime application/vnd.ms-cab-compressed
  970. >8 lelong x \b, %u bytes
  971. >28 leshort 1 \b, 1 file
  972. >28 leshort >1 \b, %u files
  973. # InstallShield Cabinet files
  974. 0 string/b ISc( InstallShield Cabinet archive data
  975. >5 byte&0xf0 =0x60 version 6,
  976. >5 byte&0xf0 !0x60 version 4/5,
  977. >(12.l+40) lelong x %u files
  978. # Windows CE package files
  979. 0 string/b MSCE\0\0\0\0 Microsoft WinCE install header
  980. >20 lelong 0 \b, architecture-independent
  981. >20 lelong 103 \b, Hitachi SH3
  982. >20 lelong 104 \b, Hitachi SH4
  983. >20 lelong 0xA11 \b, StrongARM
  984. >20 lelong 4000 \b, MIPS R4000
  985. >20 lelong 10003 \b, Hitachi SH3
  986. >20 lelong 10004 \b, Hitachi SH3E
  987. >20 lelong 10005 \b, Hitachi SH4
  988. >20 lelong 70001 \b, ARM 7TDMI
  989. >52 leshort 1 \b, 1 file
  990. >52 leshort >1 \b, %u files
  991. >56 leshort 1 \b, 1 registry entry
  992. >56 leshort >1 \b, %u registry entries
  993. # Windows Enhanced Metafile (EMF)
  994. # See msdn.microsoft.com/archive/en-us/dnargdi/html/msdn_enhmeta.asp
  995. # for further information.
  996. 0 ulelong 1
  997. >40 string \ EMF Windows Enhanced Metafile (EMF) image data
  998. >>44 ulelong x version 0x%x
  999. # from http://filext.com by Derek M Jones <derek@knosof.co.uk>
  1000. # False positive with PPT (also currently this string is too long)
  1001. #0 string/b \xD0\xCF\x11\xE0\xA1\xB1\x1A\xE1\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x3E\x00\x03\x00\xFE\xFF\x09\x00\x06 Microsoft Installer
  1002. 0 string/b \320\317\021\340\241\261\032\341 Microsoft Office Document
  1003. #>48 byte 0x1B Excel Document
  1004. #!:mime application/vnd.ms-excel
  1005. >546 string bjbj Microsoft Word Document
  1006. !:mime application/msword
  1007. >546 string jbjb Microsoft Word Document
  1008. !:mime application/msword
  1009. 0 string/b \224\246\056 Microsoft Word Document
  1010. !:mime application/msword
  1011. 512 string R\0o\0o\0t\0\ \0E\0n\0t\0r\0y Microsoft Word Document
  1012. !:mime application/msword
  1013. # From: "Nelson A. de Oliveira" <naoliv@gmail.com>
  1014. # Magic type for Dell's BIOS .hdr files
  1015. # Dell's .hdr
  1016. 0 string/b $RBU
  1017. >23 string Dell %s system BIOS
  1018. >5 byte 2
  1019. >>48 byte x version %d.
  1020. >>49 byte x \b%d.
  1021. >>50 byte x \b%d
  1022. >5 byte <2
  1023. >>48 string x version %.3s
  1024. # Type: Microsoft DirectDraw Surface
  1025. # URL: http://msdn.microsoft.com/library/default.asp?url=/library/en-us/directx9_c/directx/graphics/reference/DDSFileReference/ddsfileformat.asp
  1026. # From: Morten Hustveit <morten@debian.org>
  1027. 0 string/b DDS\040\174\000\000\000 Microsoft DirectDraw Surface (DDS),
  1028. >16 lelong >0 %d x
  1029. >12 lelong >0 %d,
  1030. >84 string x %.4s
  1031. # Type: Microsoft Document Imaging Format (.mdi)
  1032. # URL: http://en.wikipedia.org/wiki/Microsoft_Document_Imaging_Format
  1033. # From: Daniele Sempione <scrows@oziosi.org>
  1034. # Too weak (EP)
  1035. #0 short 0x5045 Microsoft Document Imaging Format
  1036. # MS eBook format (.lit)
  1037. 0 string/b ITOLITLS Microsoft Reader eBook Data
  1038. >8 lelong x \b, version %u
  1039. !:mime application/x-ms-reader
  1040. # Windows CE Binary Image Data Format
  1041. # From: Dr. Jesus <j@hug.gs>
  1042. 0 string/b B000FF\n Windows Embedded CE binary image
  1043. # Windows Imaging (WIM) Image
  1044. 0 string/b MSWIM\000\000\000 Windows imaging (WIM) image
  1045. 0 string/b WLPWM\000\000\000 Windows imaging (WIM) image, wimlib pipable format
  1046. # The second byte of these signatures is a file version; I don't know what,
  1047. # if anything, produced files with version numbers 0-2.
  1048. # From: John Elliott <johne@seasip.demon.co.uk>
  1049. 0 string \xfc\x03\x00 Mallard BASIC program data (v1.11)
  1050. 0 string \xfc\x04\x00 Mallard BASIC program data (v1.29+)
  1051. 0 string \xfc\x03\x01 Mallard BASIC protected program data (v1.11)
  1052. 0 string \xfc\x04\x01 Mallard BASIC protected program data (v1.29+)
  1053. 0 string MIOPEN Mallard BASIC Jetsam data
  1054. 0 string Jetsam0 Mallard BASIC Jetsam index data
  1055. # DOS backup 2.0 to 3.2
  1056. # backupid.@@@
  1057. # plausibility check for date: 16-bit year at offset 3 (read little-endian so the test is host independent), then values 1-31 at offset 5 and 1-12 at offset 6 (presumably day and month)
  1058. 0x3 uleshort >1979
  1059. >0x5 ubyte-1 <31
  1060. >>0x6 ubyte-1 <12
  1061. # actually 121 nul bytes; only the first 8 are tested
  1062. >>>0x7 string \0\0\0\0\0\0\0\0
  1063. >>>>0x1 ubyte x DOS 2.0 backup id file, sequence %d
  1064. !:ext @@@
  1065. >>>>0x0 ubyte 0xff \b, last disk
  1066. # backed up file
  1067. # skip some AppleWorks word like Tomahawk.Awp, WIN98SE-DE.vhd
  1068. # by looking for trailing nul of maximal file name string
  1069. 0x52 ubyte 0
  1070. # test for flag byte: FFh~complete file, 00h~split file
  1071. # FFh -127 = -1 -127 = -128
  1072. # 00h -127 = 0 -127 = -127
  1073. >0 byte-127 <-126
  1074. # plausibility check for file name length
  1075. >>0x53 ubyte-1 <78
  1076. # looking for terminating nul of file name string
  1077. >>>(0x53.b+4) ubyte 0
  1078. # looking if last char of string is valid DOS file name
  1079. >>>>(0x53.b+3) ubyte >0x1F
  1080. # actually 44 nul bytes
  1081. # but sometimes garbage according to Ralf Quint. So can not be used as test
  1082. #>0x54 string \0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0
  1083. # first char of full file name is DOS (5Ch) or UNIX (2Fh) path separator
  1084. # only DOS variant found. UNIX variant according to V32SLASH.TXT in archive PD0315.EXE
  1085. >>>>>5 ubyte&0x8C 0x0C
  1086. # ./msdos (version 5.30) labeled the entry as
  1087. # "DOS 2.0 backed up file %s, split file, sequence %d" or
  1088. # "DOS 2.0 backed up file %s, complete file"
  1089. >>>>>>0 ubyte x DOS 2.0-3.2 backed up
  1090. #>>>>>>0 ubyte 0xff complete
  1091. >>>>>>0 ubyte 0
  1092. >>>>>>>1 uleshort x sequence %d of
  1093. # full file name with path but without drive letter and colon stored from 0x05 til 0x52
  1094. >>>>>>0x5 string x file %s
  1095. # backup name is original filename
  1096. #!:ext *
  1097. # magic/Magdir/msdos, 1169: Warning: EXTENSION type ` *' has bad char '*'
  1098. # file: line 1169: Bad magic entry ' *'
  1099. # after header original file content
  1100. >>>>>>128 indirect x \b;
  1101. # DOS backup 3.3 to 5.x
  1102. # CONTROL.nnn files
  1103. 0 string \x8bBACKUP\x20
  1104. # actually 128 nul bytes
  1105. >0xa string \0\0\0\0\0\0\0\0
  1106. >>0x9 ubyte x DOS 3.3 backup control file, sequence %d
  1107. >>0x8a ubyte 0xff \b, last disk
  1108. # NB: The BACKUP.nnn files consist of the files backed up,
  1109. # concatenated.