msdos 27 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715
  1. #------------------------------------------------------------------------------
  2. # msdos: file(1) magic for MS-DOS files
  3. #
  4. # .BAT files (Daniel Quinlan, quinlan@yggdrasil.com)
  5. # updated by Joerg Jenderek at Oct 2008
  6. 0 string @
  7. >1 string/cB \ echo\ off DOS batch file text
  8. !:mime text/x-msdos-batch
  9. >1 string/cB echo\ off DOS batch file text
  10. !:mime text/x-msdos-batch
  11. >1 string/cB rem\ DOS batch file text
  12. !:mime text/x-msdos-batch
  13. >1 string/cB set\ DOS batch file text
  14. !:mime text/x-msdos-batch
  15. # OS/2 batch files are REXX. the second regex is a bit generic, oh well
  16. # the matched commands seem to be common in REXX and uncommon elsewhere
  17. 100 regex/c =^[\ \t]{0,10}call[\ \t]{1,10}rxfunc OS/2 REXX batch file text
  18. 100 regex/c =^[\ \t]{0,10}say\ ['"] OS/2 REXX batch file text
  19. 0 leshort 0x14c MS Windows COFF Intel 80386 object file
  20. #>4 ledate x stamp %s
  21. 0 leshort 0x166 MS Windows COFF MIPS R4000 object file
  22. #>4 ledate x stamp %s
  23. 0 leshort 0x184 MS Windows COFF Alpha object file
  24. #>4 ledate x stamp %s
  25. 0 leshort 0x268 MS Windows COFF Motorola 68000 object file
  26. #>4 ledate x stamp %s
  27. 0 leshort 0x1f0 MS Windows COFF PowerPC object file
  28. #>4 ledate x stamp %s
  29. 0 leshort 0x290 MS Windows COFF PA-RISC object file
  30. #>4 ledate x stamp %s
  31. # XXX - according to Microsoft's spec, at an offset of 0x3c in a
  32. # PE-format executable is the offset in the file of the PE header;
  33. # unfortunately, that's a little-endian offset, and there's no way
  34. # to specify an indirect offset with a specified byte order.
  35. # So, for now, we assume the standard MS-DOS stub, which puts the
  36. # PE header at 0x80 = 128.
  37. #
  38. # Required OS version and subsystem version were 4.0 on some NT 3.51
  39. # executables built with Visual C++ 4.0, so it's not clear that
  40. # they're interesting. The user version was 0.0, but there's
  41. # probably some linker directive to set it. The linker version was
  42. # 3.0, except for one ".exe" which had it as 4.20 (same damn linker!).
  43. #
  44. # many of the compressed formats were extracted from IDARC 1.23 source code
  45. #
  46. 0 string MZ
  47. !:mime application/x-dosexec
  48. >0x18 leshort <0x40 MS-DOS executable
  49. >0 string MZ\0\0\0\0\0\0\0\0\0\0PE\0\0 \b, PE for MS Windows
  50. >>&18 leshort&0x2000 >0 (DLL)
  51. >>&88 leshort 0 (unknown subsystem)
  52. >>&88 leshort 1 (native)
  53. >>&88 leshort 2 (GUI)
  54. >>&88 leshort 3 (console)
  55. >>&88 leshort 7 (POSIX)
  56. >>&0 leshort 0x0 unknown processor
  57. >>&0 leshort 0x14c Intel 80386
  58. >>&0 leshort 0x166 MIPS R4000
  59. >>&0 leshort 0x184 Alpha
  60. >>&0 leshort 0x268 Motorola 68000
  61. >>&0 leshort 0x1f0 PowerPC
  62. >>&0 leshort 0x290 PA-RISC
  63. >>&18 leshort&0x0100 >0 32-bit
  64. >>&18 leshort&0x1000 >0 system file
  65. >>&0xf4 search/0x140 \x0\x40\x1\x0
  66. >>>(&0.l+(4)) string MSCF \b, WinHKI CAB self-extracting archive
  67. >30 string Copyright\ 1989-1990\ PKWARE\ Inc. Self-extracting PKZIP archive
  68. !:mime application/zip
  69. # Note: "Copr." (not "Corp.") in the next line is intentional; it appears to be how the PKLITE stub abbreviates "Copyright".
  70. >30 string PKLITE\ Copr. Self-extracting PKZIP archive
  71. !:mime application/zip
  72. >0x18 leshort >0x3f
  73. >>(0x3c.l) string PE\0\0 PE
  74. >>>(0x3c.l+25) byte 1 \b32 executable
  75. >>>(0x3c.l+25) byte 2 \b32+ executable
  76. # hooray, there's a DOS extender using the PE format, with a valid PE
  77. # executable inside (which just prints a message and exits if run in win)
  78. >>>(0x3c.l+92) leshort <10
  79. >>>>(8.s*16) string 32STUB for MS-DOS, 32rtm DOS extender
  80. >>>>(8.s*16) string !32STUB for MS Windows
  81. >>>>>(0x3c.l+22) leshort&0x2000 >0 (DLL)
  82. >>>>>(0x3c.l+92) leshort 0 (unknown subsystem)
  83. >>>>>(0x3c.l+92) leshort 1 (native)
  84. >>>>>(0x3c.l+92) leshort 2 (GUI)
  85. >>>>>(0x3c.l+92) leshort 3 (console)
  86. >>>>>(0x3c.l+92) leshort 7 (POSIX)
  87. >>>(0x3c.l+92) leshort 10 (EFI application)
  88. >>>(0x3c.l+92) leshort 11 (EFI boot service driver)
  89. >>>(0x3c.l+92) leshort 12 (EFI runtime driver)
  90. >>>(0x3c.l+92) leshort 13 (XBOX)
  91. >>>(0x3c.l+4) leshort 0x0 unknown processor
  92. >>>(0x3c.l+4) leshort 0x14c Intel 80386
  93. >>>(0x3c.l+4) leshort 0x166 MIPS R4000
  94. >>>(0x3c.l+4) leshort 0x184 Alpha
  95. >>>(0x3c.l+4) leshort 0x268 Motorola 68000
  96. >>>(0x3c.l+4) leshort 0x1f0 PowerPC
  97. >>>(0x3c.l+4) leshort 0x290 PA-RISC
  98. >>>(0x3c.l+4) leshort 0x200 Intel Itanium
  99. >>>(0x3c.l+22) leshort&0x0100 >0 32-bit
  100. >>>(0x3c.l+22) leshort&0x1000 >0 system file
  101. >>>(0x3c.l+232) lelong >0 Mono/.Net assembly
  102. >>>>(0x3c.l+0xf8) string UPX0 \b, UPX compressed
  103. >>>>(0x3c.l+0xf8) search/0x140 PEC2 \b, PECompact2 compressed
  104. >>>>(0x3c.l+0xf8) search/0x140 UPX2
  105. >>>>>(&0x10.l+(-4)) string PK\3\4 \b, ZIP self-extracting archive (Info-Zip)
  106. >>>>(0x3c.l+0xf8) search/0x140 .idata
  107. >>>>>(&0xe.l+(-4)) string PK\3\4 \b, ZIP self-extracting archive (Info-Zip)
  108. >>>>>(&0xe.l+(-4)) string ZZ0 \b, ZZip self-extracting archive
  109. >>>>>(&0xe.l+(-4)) string ZZ1 \b, ZZip self-extracting archive
  110. >>>>(0x3c.l+0xf8) search/0x140 .rsrc
  111. >>>>>(&0x0f.l+(-4)) string a\\\4\5 \b, WinHKI self-extracting archive
  112. >>>>>(&0x0f.l+(-4)) string Rar! \b, RAR self-extracting archive
  113. >>>>>(&0x0f.l+(-4)) search/0x3000 MSCF \b, InstallShield self-extracting archive
  114. >>>>>(&0x0f.l+(-4)) search/32 Nullsoft \b, Nullsoft Installer self-extracting archive
  115. >>>>(0x3c.l+0xf8) search/0x140 .data
  116. >>>>>(&0x0f.l) string WEXTRACT \b, MS CAB-Installer self-extracting archive
  117. >>>>(0x3c.l+0xf8) search/0x140 .petite\0 \b, Petite compressed
  118. >>>>>(0x3c.l+0xf7) byte x
  119. >>>>>>(&0x104.l+(-4)) string =!sfx! \b, ACE self-extracting archive
  120. >>>>(0x3c.l+0xf8) search/0x140 .WISE \b, WISE installer self-extracting archive
  121. >>>>(0x3c.l+0xf8) search/0x140 .dz\0\0\0 \b, Dzip self-extracting archive
  122. >>>>(0x3c.l+0xf8) search/0x140 .reloc
  123. >>>>>(&0xe.l+(-4)) search/0x180 PK\3\4 \b, ZIP self-extracting archive (WinZip)
  124. >>>>&(0x3c.l+0xf8) search/0x100 _winzip_ \b, ZIP self-extracting archive (WinZip)
  125. >>>>&(0x3c.l+0xf8) search/0x100 SharedD \b, Microsoft Installer self-extracting archive
  126. >>>>0x30 string Inno \b, InnoSetup self-extracting archive
  127. >>(0x3c.l) string !PE\0\0 MS-DOS executable
  128. >>(0x3c.l) string NE \b, NE
  129. >>>(0x3c.l+0x36) byte 0 (unknown OS)
  130. >>>(0x3c.l+0x36) byte 1 for OS/2 1.x
  131. >>>(0x3c.l+0x36) byte 2 for MS Windows 3.x
  132. >>>(0x3c.l+0x36) byte 3 for MS-DOS
  133. >>>(0x3c.l+0x36) byte >3 (unknown OS)
  134. >>>(0x3c.l+0x36) byte 0x81 for MS-DOS, Phar Lap DOS extender
  135. >>>(0x3c.l+0x0c) leshort&0x8003 0x8002 (DLL)
  136. >>>(0x3c.l+0x0c) leshort&0x8003 0x8001 (driver)
  137. >>>&(&0x24.s-1) string ARJSFX \b, ARJ self-extracting archive
  138. >>>(0x3c.l+0x70) search/0x80 WinZip(R)\ Self-Extractor \b, ZIP self-extracting archive (WinZip)
  139. >>(0x3c.l) string LX\0\0 \b, LX
  140. >>>(0x3c.l+0x0a) leshort <1 (unknown OS)
  141. >>>(0x3c.l+0x0a) leshort 1 for OS/2
  142. >>>(0x3c.l+0x0a) leshort 2 for MS Windows
  143. >>>(0x3c.l+0x0a) leshort 3 for DOS
  144. >>>(0x3c.l+0x0a) leshort >3 (unknown OS)
  145. >>>(0x3c.l+0x10) lelong&0x28000 =0x8000 (DLL)
  146. >>>(0x3c.l+0x10) lelong&0x20000 >0 (device driver)
  147. >>>(0x3c.l+0x10) lelong&0x300 0x300 (GUI)
  148. >>>(0x3c.l+0x10) lelong&0x28300 <0x300 (console)
  149. >>>(0x3c.l+0x08) leshort 1 i80286
  150. >>>(0x3c.l+0x08) leshort 2 i80386
  151. >>>(0x3c.l+0x08) leshort 3 i80486
  152. >>>(8.s*16) string emx \b, emx
  153. >>>>&1 string x %s
  154. >>>&(&0x54.l-3) string arjsfx \b, ARJ self-extracting archive
  155. # MS Windows system file, supposedly a collection of LE executables
  156. >>(0x3c.l) string W3 \b, W3 for MS Windows
  157. >>(0x3c.l) string LE\0\0 \b, LE executable
  158. >>>(0x3c.l+0x0a) leshort 1
  159. # some DOS extenders use LE files with OS/2 header
  160. >>>>0x240 search/0x100 DOS/4G for MS-DOS, DOS4GW DOS extender
  161. >>>>0x240 search/0x200 WATCOM\ C/C++ for MS-DOS, DOS4GW DOS extender
  162. >>>>0x440 search/0x100 CauseWay\ DOS\ Extender for MS-DOS, CauseWay DOS extender
  163. >>>>0x40 search/0x40 PMODE/W for MS-DOS, PMODE/W DOS extender
  164. >>>>0x40 search/0x40 STUB/32A for MS-DOS, DOS/32A DOS extender (stub)
  165. >>>>0x40 search/0x80 STUB/32C for MS-DOS, DOS/32A DOS extender (configurable stub)
  166. >>>>0x40 search/0x80 DOS/32A for MS-DOS, DOS/32A DOS extender (embedded)
  167. # this is a wild guess; hopefully it is a specific signature
  168. >>>>&0x24 lelong <0x50
  169. >>>>>(&0x4c.l) string \xfc\xb8WATCOM
  170. >>>>>>&0 search/8 3\xdbf\xb9 \b, 32Lite compressed
  171. # another wild guess: if real OS/2 LE executables exist, they probably have higher start EIP
  172. #>>>>(0x3c.l+0x1c) lelong >0x10000 for OS/2
  173. # fails with DOS-Extenders.
  174. >>>(0x3c.l+0x0a) leshort 2 for MS Windows
  175. >>>(0x3c.l+0x0a) leshort 3 for DOS
  176. >>>(0x3c.l+0x0a) leshort 4 for MS Windows (VxD)
  177. >>>(&0x7c.l+0x26) string UPX \b, UPX compressed
  178. >>>&(&0x54.l-3) string UNACE \b, ACE self-extracting archive
  179. # looks like ASCII, probably some embedded copyright message.
  180. # and definitely not NE/LE/LX/PE
  181. >>0x3c lelong >0x20000000
  182. >>>(4.s*512) leshort !0x014c \b, MZ for MS-DOS
  183. # header data too small for extended executable
  184. >2 long !0
  185. >>0x18 leshort <0x40
  186. >>>(4.s*512) leshort !0x014c
  187. >>>>&(2.s-514) string !LE
  188. >>>>>&-2 string !BW \b, MZ for MS-DOS
  189. >>>>&(2.s-514) string LE \b, LE
  190. >>>>>0x240 search/0x100 DOS/4G for MS-DOS, DOS4GW DOS extender
  191. # educated guess since indirection is still not capable enough for complex offset
  192. # calculations (next embedded executable would be at &(&2*512+&0-2))
  193. # I suspect there are only LE executables in these multi-exe files; "\b" must lead the description to suppress the separator space
  194. >>>>&(2.s-514) string BW
  195. >>>>>0x240 search/0x100 DOS/4G \b, LE for MS-DOS, DOS4GW DOS extender (embedded)
  196. >>>>>0x240 search/0x100 !DOS/4G \b, BW collection for MS-DOS
  197. # This sequence skips to the first COFF segment, usually .text
  198. >(4.s*512) leshort 0x014c \b, COFF
  199. >>(8.s*16) string go32stub for MS-DOS, DJGPP go32 DOS extender
  200. >>(8.s*16) string emx
  201. >>>&1 string x for DOS, Win or OS/2, emx %s
  202. >>&(&0x42.l-3) byte x
  203. >>>&0x26 string UPX \b, UPX compressed
  204. # and yet another guess: a small .text followed by a large .data is unusual, could be 32lite
  205. >>&0x2c search/0xa0 .text
  206. >>>&0x0b lelong <0x2000
  207. >>>>&0 lelong >0x6000 \b, 32lite compressed
  208. >(8.s*16) string $WdX \b, WDos/X DOS extender
  209. # .EXE formats (Greg Roelofs, newt@uchicago.edu)
  210. #
  211. >0x35 string \x8e\xc0\xb9\x08\x00\xf3\xa5\x4a\x75\xeb\x8e\xc3\x8e\xd8\x33\xff\xbe\x30\x00\x05 \b, aPack compressed
  212. >0xe7 string LH/2\ Self-Extract \b, %s
  213. >0x1c string diet \b, diet compressed
  214. >0x1c string LZ09 \b, LZEXE v0.90 compressed
  215. >0x1c string LZ91 \b, LZEXE v0.91 compressed
  216. >0x1c string tz \b, TinyProg compressed
  217. >0x1e string PKLITE \b, %s compressed
  218. >0x64 string W\ Collis\0\0 \b, Compack compressed
  219. >0x24 string LHa's\ SFX \b, LHa self-extracting archive
  220. !:mime application/x-lha
  221. >0x24 string LHA's\ SFX \b, LHa self-extracting archive
  222. !:mime application/x-lha
  223. >0x24 string \ $ARX \b, ARX self-extracting archive
  224. >0x24 string \ $LHarc \b, LHarc self-extracting archive
  225. >0x20 string SFX\ by\ LARC \b, LARC self-extracting archive
  226. >1638 string -lh5- \b, LHa self-extracting archive v2.13S
  227. >0x17888 string Rar! \b, RAR self-extracting archive
  228. >0x40 string aPKG \b, aPackage self-extracting archive
  229. >32 string AIN
  230. >>35 string 2 \b, AIN 2.x compressed
  231. >>35 string <2 \b, AIN 1.x compressed
  232. >>35 string >2 \b, AIN 1.x compressed
  233. >28 string UC2X \b, UCEXE compressed
  234. >28 string WWP\ \b, WWPACK compressed
  235. # skip to the end of the exe
  236. >(4.s*512) long x
  237. >>&(2.s-517) byte x
  238. >>>&0 string PK\3\4 \b, ZIP self-extracting archive
  239. >>>&0 string Rar! \b, RAR self-extracting archive
  240. >>>&0 string =!\x11 \b, AIN 2.x self-extracting archive
  241. >>>&0 string =!\x12 \b, AIN 2.x self-extracting archive
  242. >>>&0 string =!\x17 \b, AIN 1.x self-extracting archive
  243. >>>&0 string =!\x18 \b, AIN 1.x self-extracting archive
  244. >>>&7 search/400 **ACE** \b, ACE self-extracting archive
  245. >>>&0 search/0x480 UC2SFX\ Header \b, UC2 self-extracting archive
  246. >0x1c string RJSX \b, ARJ self-extracting archive
  247. # winarj stores a message in the stub instead of the sig in the MZ header
  248. >0x20 search/0xe0 aRJsfX \b, ARJ self-extracting archive
  249. # a few unknown ZIP sfxes, no idea if they are needed or if they are
  250. # already captured by the generic patterns above
  251. >122 string Windows\ self-extracting\ ZIP \b, ZIP self-extracting archive
  252. >(8.s*16) search/0x20 PKSFX \b, ZIP self-extracting archive (PKZIP)
  253. # TODO: how to add this? >FileSize-34 string Windows\ Self-Installing\ Executable \b, ZIP self-extracting archive
  254. #
  255. # TELVOX Teleinformatica CODEC self-extractor for OS/2:
  256. >49801 string \x79\xff\x80\xff\x76\xff \b, CODEC archive v3.21
  257. >>49824 leshort =1 \b, 1 file
  258. >>49824 leshort >1 \b, %u files
  259. # .COM formats (Daniel Quinlan, quinlan@yggdrasil.com)
  260. # Uncommenting only the first two lines will cover about 2/3 of COM files,
  261. # but it isn't feasible to match all COM files since there must be at least
  262. # two dozen different one-byte "magics".
  263. # test too generic ?
  264. 0 byte 0xe9 DOS executable (COM)
  265. >0x1FE leshort 0xAA55 \b, boot code
  266. >6 string SFX\ of\ LHarc (%s)
  267. 0 belong 0xffffffff DOS executable (device driver)
  268. #CMD640X2.SYS
  269. >10 string >\x23
  270. >>10 string !\x2e
  271. >>>17 string <\x5B
  272. >>>>10 string x \b, name: %.8s
  273. #UDMA.SYS KEYB.SYS CMD640X2.SYS
  274. >10 string <\x41
  275. >>12 string >\x40
  276. >>>10 string !$
  277. >>>>12 string x \b, name: %.8s
  278. #BTCDROM.SYS ASPICD.SYS
  279. >22 string >\x40
  280. >>22 string <\x5B
  281. >>>23 string <\x5B
  282. >>>>22 string x \b, name: %.8s
  283. #ATAPICD.SYS
  284. >76 string \0
  285. >>77 string >\x40
  286. >>>77 string <\x5B
  287. >>>>77 string x \b, name: %.8s
  288. # test too generic ?
  289. 0 byte 0x8c DOS executable (COM)
  290. # updated by Joerg Jenderek at Oct 2008
  291. 0 ulelong 0xffff10eb DR-DOS executable (COM)
  292. # byte 0xeb conflicts with "sequent" magic leshort 0xn2eb
  293. 0 ubeshort&0xeb8d >0xeb00
  294. # DR-DOS STACKER.COM SCREATE.SYS missed
  295. >0 byte 0xeb DOS executable (COM)
  296. >>0x1FE leshort 0xAA55 \b, boot code
  297. >>85 string UPX \b, UPX compressed
  298. >>4 string \ $ARX \b, ARX self-extracting archive
  299. >>4 string \ $LHarc \b, LHarc self-extracting archive
  300. >>0x20e string SFX\ by\ LARC \b, LARC self-extracting archive
  301. # updated by Joerg Jenderek at Oct 2008
  302. # first byte 0xb8 with bit 15 of the first word clear; replaces the old test "0 byte 0xb8 COM executable"
  303. 0 uleshort&0x80ff 0x00b8
  304. # modified by Joerg Jenderek: any immediate at offset 1 other than the COMBOOT one is reported as a plain DOS COM file
  305. >1 lelong !0x21cd4cff COM executable for DOS
  306. # http://syslinux.zytor.com/comboot.php
  307. # (32-bit COMBOOT) programs *.C32 contain 32-bit code and run in flat-memory 32-bit protected mode
  308. # they start with the instruction mov eax,21cd4cffh, i.e. byte 0xb8 followed by the little-endian immediate 0x21cd4cff
  309. 0 uleshort&0xc0ff 0xc0b8
  310. >1 lelong 0x21cd4cff COM executable (32-bit COMBOOT)
  311. 0 string \x81\xfc
  312. >4 string \x77\x02\xcd\x20\xb9
  313. >>36 string UPX! FREE-DOS executable (COM), UPX compressed
  314. 252 string Must\ have\ DOS\ version DR-DOS executable (COM)
  315. # added by Joerg Jenderek at Oct 2008
  316. # GRR search is not working
  317. #34 search/2 UPX! FREE-DOS executable (COM), UPX compressed
  318. 34 string UPX! FREE-DOS executable (COM), UPX compressed
  319. 35 string UPX! FREE-DOS executable (COM), UPX compressed
  320. # GRR search is not working
  321. #2 search/28 \xcd\x21 COM executable for MS-DOS
  322. #WHICHFAT.cOM
  323. 2 string \xcd\x21 COM executable for DOS
  324. #DELTREE.cOM DELTREE2.cOM
  325. 4 string \xcd\x21 COM executable for DOS
  326. #IFMEMDSK.cOM ASSIGN.cOM COMP.cOM
  327. 5 string \xcd\x21 COM executable for DOS
  328. #DELTMP.COm HASFAT32.cOM
  329. 7 string \xcd\x21
  330. >0 byte !0xb8 COM executable for DOS
  331. #COMP.cOM MORE.COm
  332. 10 string \xcd\x21
  333. >5 string !\xcd\x21 COM executable for DOS
  334. #comecho.com
  335. 13 string \xcd\x21 COM executable for DOS
  336. #HELP.COm EDIT.coM
  337. 18 string \xcd\x21 COM executable for MS-DOS
  338. #NWRPLTRM.COm
  339. 23 string \xcd\x21 COM executable for MS-DOS
  340. #LOADFIX.cOm LOADFIX.cOm
  341. 30 string \xcd\x21 COM executable for MS-DOS
  342. #syslinux.com 3.11
  343. 70 string \xcd\x21 COM executable for DOS
  344. # many compressed/converted COMs start with a copy loop instead of a jump
  345. 0x6 search/0xa \xfc\x57\xf3\xa5\xc3 COM executable for MS-DOS
  346. 0x6 search/0xa \xfc\x57\xf3\xa4\xc3 COM executable for DOS
  347. >0x18 search/0x10 \x50\xa4\xff\xd5\x73 \b, aPack compressed
  348. 0x3c string W\ Collis\0\0 COM executable for MS-DOS, Compack compressed
  349. # FIXME: missing diet .com compression
  350. # miscellaneous formats
  351. 0 string LZ MS-DOS executable (built-in)
  352. #0 byte 0xf0 MS-DOS program library data
  353. #
  354. # AAF files:
  355. # <stuartc@rd.bbc.co.uk> Stuart Cunningham
  356. 0 string \320\317\021\340\241\261\032\341AAFB\015\000OM\006\016\053\064\001\001\001\377 AAF legacy file using MS Structured Storage
  357. >30 byte 9 (512B sectors)
  358. >30 byte 12 (4kB sectors)
  359. 0 string \320\317\021\340\241\261\032\341\001\002\001\015\000\002\000\000\006\016\053\064\003\002\001\001 AAF file using MS Structured Storage
  360. >30 byte 9 (512B sectors)
  361. >30 byte 12 (4kB sectors)
  362. # Popular applications
  363. 2080 string Microsoft\ Word\ 6.0\ Document %s
  364. !:mime application/msword
  365. 2080 string Documento\ Microsoft\ Word\ 6 Spanish Microsoft Word 6 document data
  366. !:mime application/msword
  367. # Pawel Wiecek <coven@i17linuxb.ists.pwr.wroc.pl> (for polish Word)
  368. 2112 string MSWordDoc Microsoft Word document data
  369. !:mime application/msword
  370. #
  371. 0 belong 0x31be0000 Microsoft Word Document
  372. !:mime application/msword
  373. #
  374. 0 string PO^Q` Microsoft Word 6.0 Document
  375. !:mime application/msword
  376. #
  377. 0 string \376\067\0\043 Microsoft Office Document
  378. !:mime application/msword
  379. 0 string \333\245-\0\0\0 Microsoft Office Document
  380. !:mime application/msword
  381. 512 string \354\245\301 Microsoft Word Document
  382. !:mime application/msword
  383. #
  384. 2080 string Microsoft\ Excel\ 5.0\ Worksheet %s
  385. !:mime application/vnd.ms-excel
  386. 2080 string Foglio\ di\ lavoro\ Microsoft\ Exce %s
  387. !:mime application/vnd.ms-excel
  388. #
  389. # Pawel Wiecek <coven@i17linuxb.ists.pwr.wroc.pl> (for polish Excel)
  390. 2114 string Biff5 Microsoft Excel 5.0 Worksheet
  391. !:mime application/vnd.ms-excel
  392. # Italian MS-Excel
  393. 2121 string Biff5 Microsoft Excel 5.0 Worksheet
  394. !:mime application/vnd.ms-excel
  395. 0 string \x09\x04\x06\x00\x00\x00\x10\x00 Microsoft Excel Worksheet
  396. !:mime application/vnd.ms-excel
  397. #
  398. 0 belong 0x00001a00 Lotus 1-2-3
  399. !:mime application/x-123
  400. >4 belong 0x00100400 wk3 document data
  401. >4 belong 0x02100400 wk4 document data
  402. >4 belong 0x07800100 fm3 or fmb document data
  403. >4 belong 0x07800000 fm3 or fmb document data
  404. #
  405. 0 belong 0x00000200 Lotus 1-2-3
  406. !:mime application/x-123
  407. >4 belong 0x06040600 wk1 document data
  408. >4 belong 0x06800200 fmt document data
  409. 0 string WordPro\0 Lotus WordPro
  410. !:mime application/vnd.lotus-wordpro
  411. 0 string WordPro\r\373 Lotus WordPro
  412. !:mime application/vnd.lotus-wordpro
  413. # Summary: Script used by InstallShield to uninstall applications
  414. # Extension: .isu
  415. # Submitted by: unknown
  416. # Modified by (1): Abel Cheung <abelcheung@gmail.com> (replace useless entry)
  417. 0 string \x71\xa8\x00\x00\x01\x02
  418. >12 string Stirling\ Technologies, InstallShield Uninstall Script
  419. # Winamp .avs
  420. #0 string Nullsoft\ AVS\ Preset\ \060\056\061\032 A plug in for Winamp ms-windows Freeware media player
  421. 0 string Nullsoft\ AVS\ Preset\ Winamp plug in
  422. # Windows Metafile .WMF
  423. 0 string \327\315\306\232 ms-windows metafont .wmf
  424. 0 string \002\000\011\000 ms-windows metafont .wmf
  425. 0 string \001\000\011\000 ms-windows metafont .wmf
  426. #tz3 files whatever that is (MS Works files)
  427. 0 string \003\001\001\004\070\001\000\000 tz3 ms-works file
  428. 0 string \003\002\001\004\070\001\000\000 tz3 ms-works file
  429. 0 string \003\003\001\004\070\001\000\000 tz3 ms-works file
  430. # PGP sig files .sig
  431. #0 string \211\000\077\003\005\000\063\237\127 065 to \027\266\151\064\005\045\101\233\021\002 PGP sig
  432. 0 string \211\000\077\003\005\000\063\237\127\065\027\266\151\064\005\045\101\233\021\002 PGP sig
  433. 0 string \211\000\077\003\005\000\063\237\127\066\027\266\151\064\005\045\101\233\021\002 PGP sig
  434. 0 string \211\000\077\003\005\000\063\237\127\067\027\266\151\064\005\045\101\233\021\002 PGP sig
  435. 0 string \211\000\077\003\005\000\063\237\127\070\027\266\151\064\005\045\101\233\021\002 PGP sig
  436. 0 string \211\000\077\003\005\000\063\237\127\071\027\266\151\064\005\045\101\233\021\002 PGP sig
  437. 0 string \211\000\225\003\005\000\062\122\207\304\100\345\042 PGP sig
  438. # windows zips files .dmf
  439. 0 string MDIF\032\000\010\000\000\000\372\046\100\175\001\000\001\036\001\000 MS Windows special zipped file
  440. #ico files
  441. 0 string \102\101\050\000\000\000\056\000\000\000\000\000\000\000 Icon for MS Windows
  442. # Windows icons (Ian Springer <ips@fpk.hp.com>)
  443. 0 string \000\000\001\000 MS Windows icon resource
  444. !:mime image/x-ico
  445. >4 byte 1 - 1 icon
  446. >4 byte >1 - %d icons
  447. >>6 byte >0 \b, %dx
  448. >>>7 byte >0 \b%d
  449. >>8 byte 0 \b, 256-colors
  450. >>8 byte >0 \b, %d-colors
  451. # .chr files
  452. 0 string PK\010\010BGI Borland font
  453. >4 string >\0 %s
  454. # then there is a copyright notice
  455. # .bgi files
  456. 0 string pk\010\010BGI Borland device
  457. >4 string >\0 %s
  458. # then there is a copyright notice
  459. # Windows Recycle Bin record file (named INFO2)
  460. # By Abel Cheung (abelcheung AT gmail dot com)
  461. # Version 4 always has 280 bytes (0x118) per record, version 5 has 800 bytes
  462. # Since Vista uses another structure, INFO2 structure probably won't change
  463. # anymore. Detailed analysis in:
  464. # http://www.cybersecurityinstitute.biz/downloads/INFO2.pdf
  465. 0 lelong 0x00000004
  466. >12 lelong 0x00000118 Windows Recycle Bin INFO2 file (Win98 or below)
  467. 0 lelong 0x00000005
  468. >12 lelong 0x00000320 Windows Recycle Bin INFO2 file (Win2k - WinXP)
  469. ##### put in Either Magic/font or Magic/news
  470. # Acroread or something files wrongly identified as G3 .pfm
  471. # these have the form \000 \001 any? \002 \000 \000
  472. # or \000 \001 any? \022 \000 \000
  473. #0 string \000\001 pfm?
  474. #>3 string \022\000\000Copyright\ yes
  475. #>3 string \002\000\000Copyright\ yes
  476. #>3 string >\0 oops, not a font file. Cancel that.
  477. #it clashes with ttf files so put it lower down.
  478. # From Doug Lee via a FreeBSD pr
  479. 9 string GERBILDOC First Choice document
  480. 9 string GERBILDB First Choice database
  481. 9 string GERBILCLIP First Choice database
  482. 0 string GERBIL First Choice device file
  483. 9 string RABBITGRAPH RabbitGraph file
  484. 0 string DCU1 Borland Delphi .DCU file
  485. 0 string =!<spell> MKS Spell hash list (old format)
  486. 0 string =!<spell2> MKS Spell hash list
  487. # Too simple - MPi
  488. #0 string AH Halo(TM) bitmapped font file
  489. 0 lelong 0x08086b70 TurboC BGI file
  490. 0 lelong 0x08084b50 TurboC Font file
  491. # WARNING: below line conflicts with Infocom game data Z-machine 3
  492. 0 byte 0x03 DBase 3 data file
  493. >0x04 lelong 0 (no records)
  494. >0x04 lelong >0 (%ld records)
  495. 0 byte 0x83 DBase 3 data file with memo(s)
  496. >0x04 lelong 0 (no records)
  497. >0x04 lelong >0 (%ld records)
  498. 0 leshort 0x0006 DBase 3 index file
  499. 0 string PMCC Windows 3.x .GRP file
  500. 1 string RDC-meg MegaDots
  501. >8 byte >0x2F version %c
  502. >9 byte >0x2F \b.%c file
  503. 0 lelong 0x4C
  504. >4 lelong 0x00021401 Windows shortcut file
  505. # DOS EPS Binary File Header
  506. # From: Ed Sznyter <ews@Black.Market.NET>
  507. 0 belong 0xC5D0D3C6 DOS EPS Binary File
  508. >4 long >0 Postscript starts at byte %d
  509. >>8 long >0 length %d
  510. >>>12 long >0 Metafile starts at byte %d
  511. >>>>16 long >0 length %d
  512. >>>20 long >0 TIFF starts at byte %d
  513. >>>>24 long >0 length %d
  514. # TNEF magic From "Joomy" <joomy@se-ed.net>
  515. # Microsoft Outlook's Transport Neutral Encapsulation Format (TNEF); the signature is a 32-bit little-endian value, so it must be tested with lelong (a 16-bit leshort can never equal it)
  516. 0 lelong 0x223e9f78 TNEF
  517. !:mime application/vnd.ms-tnef
  518. # HtmlHelp files (.chm)
  519. 0 string ITSF\003\000\000\000\x60\000\000\000\001\000\000\000 MS Windows HtmlHelp Data
  520. # GFA-BASIC (Wolfram Kleff)
  521. 2 string GFA-BASIC3 GFA-BASIC 3 data
  522. #------------------------------------------------------------------------------
  523. # From Stuart Caie <kyzer@4u.net> (developer of cabextract)
  524. # Microsoft Cabinet files
  525. 0 string MSCF\0\0\0\0 Microsoft Cabinet archive data
  526. !:mime application/vnd.ms-cab-compressed
  527. >8 lelong x \b, %u bytes
  528. >28 leshort 1 \b, 1 file
  529. >28 leshort >1 \b, %u files
  530. # InstallShield Cabinet files
  531. 0 string ISc( InstallShield Cabinet archive data
  532. >5 byte&0xf0 =0x60 version 6,
  533. >5 byte&0xf0 !0x60 version 4/5,
  534. >(12.l+40) lelong x %u files
  535. # Windows CE package files
  536. 0 string MSCE\0\0\0\0 Microsoft WinCE install header
  537. >20 lelong 0 \b, architecture-independent
  538. >20 lelong 103 \b, Hitachi SH3
  539. >20 lelong 104 \b, Hitachi SH4
  540. >20 lelong 0xA11 \b, StrongARM
  541. >20 lelong 4000 \b, MIPS R4000
  542. >20 lelong 10003 \b, Hitachi SH3
  543. >20 lelong 10004 \b, Hitachi SH3E
  544. >20 lelong 10005 \b, Hitachi SH4
  545. >20 lelong 70001 \b, ARM 7TDMI
  546. >52 leshort 1 \b, 1 file
  547. >52 leshort >1 \b, %u files
  548. >56 leshort 1 \b, 1 registry entry
  549. >56 leshort >1 \b, %u registry entries
  550. # Windows Enhanced Metafile (EMF)
  551. # See msdn.microsoft.com/archive/en-us/dnargdi/html/msdn_enhmeta.asp
  552. # for further information.
  553. 0 ulelong 1
  554. >40 string \ EMF Windows Enhanced Metafile (EMF) image data
  555. >>44 ulelong x version 0x%x
  556. # From: Alex Beregszaszi <alex@fsn.hu>
  557. 0 string COWD VMWare3
  558. >4 byte 3 disk image
  559. >>32 lelong x (%d/
  560. >>36 lelong x \b%d/
  561. >>40 lelong x \b%d)
  562. >4 byte 2 undoable disk image
  563. >>32 string >\0 (%s)
  564. 0 string VMDK VMware4 disk image
  565. 0 string KDMV VMware4 disk image
  566. #--------------------------------------------------------------------
  567. # Qemu Emulator Images
  568. # Lines written by Friedrich Schwittay (f.schwittay@yousable.de)
  569. # Made by reading sources and doing trial and error on existing
  570. # qcow files
  571. 0 string QFI Qemu Image, Format: Qcow
  572. # Uncomment the following line to display Magic (only used for debugging
  573. # this magic number)
  574. #>0 string x , Magic: %s
  575. # There are currently 2 Versions: "1" and "2"
  576. # I do not use Version 2 and therefore branch here
  577. # but can assure: it works (tested on both versions)
  578. # Also my Qemu 0.9.0 which uses this Version 2 refuses
  579. # to start in its bios
  580. >0x04 belong 2 , Version: 2
  581. >0x04 belong 1 , Version: 1
  582. # Using the existence of the Backing File Offset to Branch or not
  583. # to read Backing File Information
  584. >>0xc belong >0 , Backing File( Offset: %lu
  585. >>>(0xc.L) string >\0 , Path: %s
  586. # Didn't get the trick here how qemu stores the "Size" at this Position
  587. # There is actually something stored but nothing makes sense
  588. # The header in the sources talks about it
  589. #>>>16 lelong x , Size: %lu
  590. # Modification time of the Backing File
  591. # Really useful if you want to know if your backing
  592. # file is still usable together with this image
  593. >>>20 bedate x , Mtime: %s )
  594. # Don't know how to calculate in Magicfiles
  595. # Also: this Information is not reliably
  596. # stored in image-files
  597. >>24 lelong x , Disk Size could be: %d * 256 bytes
  598. 0 string QEVM QEMU's suspend to disk image
  599. 0 string Bochs\ Virtual\ HD\ Image Bochs disk image,
  600. >32 string x type %s,
  601. >48 string x subtype %s
  602. 0 lelong 0x02468ace Bochs Sparse disk image
  603. # from http://filext.com by Derek M Jones <derek@knosof.co.uk>
  604. # False positive with PPT (also currently this string is too long)
  605. #0 string \xD0\xCF\x11\xE0\xA1\xB1\x1A\xE1\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x3E\x00\x03\x00\xFE\xFF\x09\x00\x06 Microsoft Installer
  606. 0 string \320\317\021\340\241\261\032\341 Microsoft Office Document
  607. #>48 byte 0x1B Excel Document
  608. #!:mime application/vnd.ms-excel
  609. >546 string bjbj Microsoft Word Document
  610. !:mime application/msword
  611. >546 string jbjb Microsoft Word Document
  612. !:mime application/msword
  613. 0 string \224\246\056 Microsoft Word Document
  614. !:mime application/msword
  615. 512 string R\0o\0o\0t\0\ \0E\0n\0t\0r\0y Microsoft Word Document
  616. !:mime application/msword
  617. # From: "Nelson A. de Oliveira" <naoliv@gmail.com>
  618. # Magic type for Dell's BIOS .hdr files
  619. # Dell's .hdr
  620. 0 string $RBU
  621. >23 string Dell %s system BIOS
  622. >48 string x version %.3s
  623. # Type: Microsoft DirectDraw Surface (prints the 32-bit values at offsets 16 and 12 as "<a> x <b>,", then 4 characters from offset 84)
  624. # URL: http://msdn.microsoft.com/library/default.asp?url=/library/en-us/directx9_c/directx/graphics/reference/DDSFileReference/ddsfileformat.asp
  625. # From: Morten Hustveit <morten@debian.org>
  626. 0 string DDS\040\174\000\000\000 Microsoft DirectDraw Surface (DDS),
  627. >16 lelong >0 %d x
  628. >12 lelong >0 %d,
  629. >84 string x %.4s
  630. # Type: Microsoft Document Imaging Format (.mdi)
  631. # URL: http://en.wikipedia.org/wiki/Microsoft_Document_Imaging_Format
  632. # From: Daniele Sempione <scrows@oziosi.org>
  633. 0 short 0x5045 Microsoft Document Imaging Format
  634. # MS eBook format (.lit)
  635. 0 string ITOLITLS Microsoft Reader eBook Data
  636. >8 lelong x \b, version %u
  637. !:mime application/x-ms-reader