opnsense-src/contrib/file/magic/Magdir/msdos
Xin LI 71c92e6b94 MFC: MFV: file 5.46.
(cherry picked from commit ae316d1d1c)
2024-12-21 23:37:20 -08:00

3073 lines
125 KiB
Text
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

#------------------------------------------------------------------------------
# $File: msdos,v 1.208 2024/08/27 18:50:57 christos Exp $
# msdos: file(1) magic for MS-DOS files
#
# .BAT files (Daniel Quinlan, quinlan@yggdrasil.com)
# updated by Joerg Jenderek at Oct 2008,Apr 2011
# Entry test: the file has to begin with "@". The /t flag marks this as a
# test for text files (see magic(5)).
0 string/t @
# Every continuation below looks at offset 1, i.e. at the text directly after
# the "@", for a command that typically opens a batch file. Per magic(5) the
# /c flag lets lower case letters of the pattern match either case in the
# target, and /W compacts whitespace in the target (at least one whitespace
# character is required where the pattern has a blank). All four variants
# report the same description, MIME type and extension.
# Variant "@ echo off" (blank between "@" and the command)
>1 string/cW \ echo\ off DOS batch file text
!:mime text/x-msdos-batch
!:ext bat
# Variant "@echo off"
>1 string/cW echo\ off DOS batch file text
!:mime text/x-msdos-batch
!:ext bat
# Variant "@rem"
>1 string/cW rem DOS batch file text
!:mime text/x-msdos-batch
!:ext bat
# Variant "@set" followed by a blank
>1 string/cW set\ DOS batch file text
!:mime text/x-msdos-batch
!:ext bat
# OS/2 batch files are REXX. The second regex is a bit generic, oh well
# the matched commands seem to be common in REXX and uncommon elsewhere
# Both rules work in two steps: first a search for a keyword, starting at
# offset 100 and limited to a range of 0xffff bytes; only if that succeeds, a
# regex (/c: case insensitive) that wants the keyword used as a statement,
# anchored with ^ and preceded by at most 10 blanks or tabs.
# Step pair 1: keyword "rxfuncadd", then a "call rxfunc..." statement
100 search/0xffff rxfuncadd
>100 regex/c =^[\ \t]{0,10}call[\ \t]{1,10}rxfunc OS/2 REXX batch file text
# Step pair 2: keyword "say", then a "say" statement followed by a blank and
# an opening single or double quote
100 search/0xffff say
>100 regex/c =^[\ \t]{0,10}say\ ['"] OS/2 REXX batch file text
# Tests for various EXE types.
#
# Many of the compressed formats were extracted from IDARC 1.23 source code.
#
# e_magic
0 string/b MZ
# TODO
# FLT: Syntrillium CoolEdit Filter https://en.wikipedia.org/wiki/Adobe_Audition
# FMX64:FileMaker Pro 64-bit plug-in https://en.wikipedia.org/wiki/FileMaker
# FMX: FileMaker Pro 32-bit plug-in https://en.wikipedia.org/wiki/FileMaker
# FOD: WIFE Font Driver
# GAU: MS Flight Simulator Gauge
# IFS: OS/2 Installable File System https://en.wikipedia.org/wiki/OS/2
# MEXW32:MATLAB Windows 32bit compiled function https://en.wikipedia.org/wiki/MATLAB
# MEXW64:MATLAB Windows 64bit compiled function https://en.wikipedia.org/wiki/MATLAB
# MLL: Maya plug-in (generic) http://en.wikipedia.org/wiki/Autodesk_Maya
# PFL: PhotoFilter plugin http://photofiltre.free.fr
# 8*: PhotoShop plug-in (generic) http://www.adobe.com/products/photoshop/main.html
# PLG: Aston Shell plugin http://www.astonshell.com/
# QLB: Microsoft Basic Quick library https://en.wikipedia.org/wiki/QuickBASIC
# SKL: WinLIFT skin http://www.zapsolution.com/winlift/index.htm
# TBK: Asymetrix ToolBook application http://www.toolbook.com
# TBP: The Bat! plugin http://www.ritlabs.com
# UPC: Ultimate Paint Graphics Editor plugin http://ultimatepaint.j-t-l.com
# XFM: Syntrillium Cool Edit Transform Effect bad http://www.cooledit.com
# XPL: X-Plane plugin http://www.xsquawkbox.net/xpsdk/
# ZAP: ZoneLabs Zone Alarm data http://www.zonelabs.com
#
# NEXT LINES FOR DEBUGGING!
# e_cblp; bytes on last page of file
# e_cp; pages in file
#>4 uleshort x \b, e_cp 0x%x
# e_lfanew; file address of new exe header
#>0x3c ulelong x \b, e_lfanew 0x%x
# e_lfarlc; address of relocation table
#>0x18 uleshort x \b, e_lfarlc=0x%x
# e_ovno; overlay number. If zero, this is the main executable foo
#>0x1a uleshort !0 \b, e_ovno 0x%x
#>0x1C ubequad !0 \b, e_res 0x%16.16llx
# e_oemid; often 0
#>0x24 uleshort !0 \b, e_oemid 0x%x
# e_oeminfo; typically zeroes, but 13Dh (WORDSTAR.CNV WPFT5.CNV) 143h (WRITWIN.CNV)
# 1A3h (DBASE.CNV LOTUS123.CNV RFTDCA.CNV WORDDOS.CNV WORDMAC.CNV WORDWIN1.CNV XLBIFF.CNV)
#>0x26 uleshort !0 \b, e_oeminfo 0x%x
# e_res2; typically zeroes, but 000006006F082D2Ah SCSICFG.EXE 00009A0300007C03h de.exe
# 0000CA0000000002h country.exe dosxmgr.exe 421E0A00421EA823h QMC.EXE
#>0x28 ubequad !0 \b, e_res2 0x%16.16llx
# https://web.archive.org/web/20171116024937/http://www.ctyme.com/intr/rb-2939.htm#table1593
# https://github.com/uxmal/reko/blob/master/src/ImageLoaders/MzExe/ExeImageLoader.cs
# new exe header magic like: PE NE LE LX W3 W4
# no examples found for ZM DL MP P2 P3
#>(0x3c.l) string x \b, at [0x3c] %.2s
#>(0x3c.l) ubelong x \b, at [0x3c] %#8.8x
#>(0x3c.l+4) ubelong x \b, at [0x3c+4] %#8.8x
#
# Most non-DOS MZ-executable extensions have the relocation table more than 0x40 bytes into the file.
# http://www.mitec.cz/Downloads/EXE.zip/EXE64.exe e_lfarlc=0x8ead
# OS/2 ECS\INSTALL\DETECTEI\PCISCAN.EXE e_lfarlc=0x1c
# some EFI apps Shell_Full.efi ext4_x64_signed.efi e_lfarlc=0
# Icon library WORD60.ICL e_lfarlc=0
# Microsoft compiled help format 2.0 WINWORD.DEV.HXS e_lfarlc=0
>0x18 uleshort <0x40
# check magic of new second header
# skip Portable Executable (PE) with low e_lfarlc here, because handled later
# like: ext4_x64_signed.efi Shell_Full.efi WINWORD.DEV.HXS
>>(0x3c.l) string !PE\0\0 MS-DOS executable
# NE executable with low e_lfarlc like: WORD60.ICL
# This is Icon Manager (IM) by Impact Software format, based on NE version 5 with cleared NE version and e_lfarlc fields
# It can be parsed/loaded as NE version 5 binary just by skipping e_lfarlc and NE version checks
# ICL: Icons Library 16-bit http://fileformats.archiveteam.org/wiki/Icon_library
>>(0x3c.l-0x02) string IMNE \b, NE
>>>(0x3c.l+0x02) ubyte x \b version %u
>>>(0x3c.l+0x36) byte 2 for MS Windows
>>>>(0x3c.l+0x3E) ushort !0
>>>>>(0x3c.l+0x3F) ubyte x %u
>>>>>(0x3c.l+0x3E) ubyte x \b.%02u
>>>(0x3c.l+0x02) ubyte x (Icon Library, Icon Manager by Impact Software)
!:ext icl
# handle LX executable with low e_lfarlc like: PCISCAN.EXE
>>(0x3c.l) string LX \b, LX
>>>(0x3c.l+0x2) uleshort =0x0000
>>>>(0x3c.l) use lx-executable
# no examples found for big endian variant
>>>(0x3c.l+0x2) uleshort =0x0101
>>>>(0x3c.l) use \^lx-executable
# no examples found for PDP-11 endian variant
>>>(0x3c.l+0x2) uleshort =0x0100
# PDP-11-endian is not supported by magic "use" keyword yet
# no examples found for other endian variants
>>>0 default x
# other endianness is not supported by magic "use" keyword
# Maybe it's a PE?
# URL: http://fileformats.archiveteam.org/wiki/Portable_Executable
# Reference: https://docs.microsoft.com/de-de/windows/win32/debug/pe-format
>(0x3c.l) string PE\0\0 PE
!:mime application/vnd.microsoft.portable-executable
# https://docs.microsoft.com/de-de/windows/win32/debug/pe-format#characteristics
# DLL Characteristics
#>>(0x3c.l+22) uleshort x \b, CHARACTERISTICS %#4.4x,
# 0x0200~IMAGE_FILE_DEBUG_STRIPPED Debugging information is removed from the image file
# 0x1000~IMAGE_FILE_SYSTEM The image file is a system file, not a user program.
# 0x2000~IMAGE_FILE_DLL The image file is a dynamic-link library (DLL)
>>(0x3c.l+24) leshort 0x010b \b32 executable
# https://learn.microsoft.com/en-us/windows/win32/debug/pe-format#windows-subsystem
#>>>(0x3c.l+92) leshort x \b, SUBSYSTEM %u
>>(0x3c.l+24) leshort 0x020b \b32+ executable
#>>>(0x3c.l+92) leshort x \b, SUBSYSTEM %u
# ROM image is without DOS MZ header and without PE\0\0 signature
#>>(0x3c.l+24) leshort 0x0107 ROM image
>>(0x3c.l+24) default x with unknown signature
>>>&0 leshort x %#x
## Start of the subsystem switch
>>(0x3c.l+92) clear x
# 0~IMAGE_SUBSYSTEM_UNKNOWN An unknown subsystem
>>(0x3c.l+92) leshort 0
# WINE https://www.winehq.org/ DLL libraries without subsystem, some examples:
# fakedlls/l3codeca.acm fakedlls/msadp32.acm fakedlls/inetcpl.cpl fakedlls/inetcpl.cpl fakedlls/kernel32.dll fakedlls/user32.dll fakedlls/gdi32.dll
# fakedlls/winex11.drv fakedlls/winspool.drv fakedlls/gphoto2.ds fakedlls/sane.ds fakedlls/ntoskrnl.exe fakedlls/dhtmled.ocx fakedlls/hhctrl.ocx
# fakedlls/hidclass.sys fakedlls/mshtml.tlb fakedlls/stdole32.tlb fakedlls/vwin32.vxd fakedlls/vmm.vxd
>>>0x40 string Wine\ placeholder\ DLL for WINE stub (DLL)
!:ext acm/cpl/dll/drv/ds/exe/ocx/sys/tlb/vxd
>>>0x40 string Wine\ builtin\ DLL for WINE (DLL)
!:ext acm/cpl/dll/drv/ds/exe/ocx/sys/tlb/vxd
>>>0 default x
# Summary: Microsoft compiled help *.HXS format 2.0
# URL: https://en.wikipedia.org/wiki/Microsoft_Help_2
# Reference: http://www.russotto.net/chm/itolitlsformat.html
# https://mark0.net/download/triddefs_xml.7z/defs/h/hxs.trid.xml
# Note: Microsoft compiled help format contains 2 PE32 sections (.rsrc, .its) for Intel i386;
# The help content is appended after the PE32 binary and starts with ITOLITLS string;
# End of the PE32 binary is immediately after the .its section.
# verified by command like:
# `pelook.exe -d WINWORD.HXS & pelook.exe -h WINWORD.HXS`
# `objdump -p -s WINWORD.HXS`
# `readpe WINWORD.HXS`
>>>>(0x3c.l+6) uleshort =2
# Second section for these binaries starts at fixed offset 288 (size of PE signature + size of COFF header + size
# of PE32 optional header with all data dirs + size of first .rsrc section header = 4 + 20 + 96+8*16 + 40 = 288)
>>>>>(0x3c.l+288) string/b .its\0\0\0\0
# Read start+length of .its section and just after it
>>>>>>(&4.l+(-4)) string ITOLITLS \b, Microsoft compiled help format 2.0
!:ext hxs
# Fallback for any unrecognized binary with Unknown subsystem 0
>>>>>>0 default x for Unknown subsystem 0
>>>>>0 default x for Unknown subsystem 0
>>>>0 default x for Unknown subsystem 0
# 1~IMAGE_SUBSYSTEM_NATIVE device drivers and native Windows processes
>>(0x3c.l+92) leshort 1
# WINE https://www.winehq.org/: fakedlls/fltmgr.sys fakedlls/mountmgr.sys fakedlls/scsiport.sys fakedlls/winebus.sys fakedlls/winehid.sys
>>>0x40 string Wine\ placeholder\ DLL for WINE stub
>>>0x40 string Wine\ builtin\ DLL for WINE
>>>0 default x for MS Windows
>>>>(0x3c.l+72) leshort x %u
>>>>(0x3c.l+74) leshort x \b.%02u
# Native PEs are used by:
# - NT kernel DLLs: hal.dll, kdcom.dll, pshed.dll, bootvid.dll, ...
# - NT kernel images: ntoskrnl.exe, ntkrnlmp.exe, ntkrnlpa.exe, ntkrpamp.exe
# - NT kernel drivers: Windows/System32/drivers/*.sys
# - NT native userspace DLLs: ntdll.dll, ...
# - NT native userspace executables: smss.exe, csrss.exe, autochk.exe, ...
# TODO: write rule to distinguish between Kernel and Native processes
# (the only way to do this is based on the presence of ntoskrnl.exe in import table)
>>>(0x3c.l+22) leshort&0x2000 >0 (native)
!:ext dll/sys
>>>(0x3c.l+22) leshort&0x2000 0 (native)
!:ext exe/sys
# 2~IMAGE_SUBSYSTEM_WINDOWS_GUI The Windows graphical user interface (GUI) subsystem
>>(0x3c.l+92) leshort 2
# WINE https://www.winehq.org/: fakedlls/clock.exe fakedlls/control.exe fakedlls/explorer.exe fakedlls/notepad.exe
>>>0x40 string Wine\ placeholder\ DLL for WINE stub
>>>0x40 string Wine\ builtin\ DLL for WINE
>>>0 default x for MS Windows
>>>>(0x3c.l+72) leshort x %u
>>>>(0x3c.l+74) leshort x \b.%02u
>>>(0x3c.l+22) leshort&0x2000 >0 (DLL)
# These could probably be at least partially distinguished from one another by
# looking for specific exported functions.
# CPL: Control Panel item
# TLB: Type library
# OCX: OLE/ActiveX control
# ACM: Audio compression manager codec
# AX: DirectShow source filter
# IME: Input method editor
!:ext dll/cpl/tlb/ocx/acm/ax/ime
>>>(0x3c.l+22) leshort&0x2000 0 (GUI)
# Screen savers typically include code from the scrnsave.lib static library, but
# that's not guaranteed.
!:ext exe/scr
# 3~IMAGE_SUBSYSTEM_WINDOWS_CUI The Windows character subsystem
>>(0x3c.l+92) leshort 3
# WINE https://www.winehq.org/: fakedlls/cacls.exe fakedlls/cmd.exe fakedlls/expand.exe fakedlls/net.exe fakedlls/reg.exe
>>>0x40 string Wine\ placeholder\ DLL for WINE stub
>>>0x40 string Wine\ builtin\ DLL for WINE
>>>0 default x for MS Windows
>>>>(0x3c.l+72) leshort x %u
>>>>(0x3c.l+74) leshort x \b.%02u
>>>(0x3c.l+22) leshort&0x2000 >0 (DLL)
!:ext dll/cpl/tlb/ocx/acm/ax/ime
>>>(0x3c.l+22) leshort&0x2000 0 (console)
!:ext exe/com
# 4~Old Windows CE subsystem (never used)
#>>(0x3c.l+92) leshort 4 for MS Windows CE OLD
# 5~IMAGE_SUBSYSTEM_OS2_CUI The OS/2 character subsystem
# Not used in image files, constant used only in in-memory structures of OS/2 subsystem as part of Windows NT
#>>(0x3c.l+92) leshort 5 for OS/2
# NO Windows Subsystem number 6!
#>>(0x3c.l+92) leshort 6 for Unknown subsystem 6
# 7~IMAGE_SUBSYSTEM_POSIX_CUI The Posix character subsystem
>>(0x3c.l+92) leshort 7 for POSIX
>>>(0x3c.l+72) leshort x %u
>>>(0x3c.l+74) leshort x \b.%02u
>>>(0x3c.l+22) leshort&0x2000 >0 (DLL)
# like: PSXDLL.DLL
!:ext dll
>>>(0x3c.l+22) leshort&0x2000 0 (EXE)
# like: PAX.EXE
!:ext exe
# 8~IMAGE_SUBSYSTEM_NATIVE_WINDOWS Native Win9x driver
# Win9x never used subsystem 8, all Win9x drivers are either LE/VXD or PE with native (1) subsystem
# MSVC4 LINK.EXE can create PE binary for subsystem 8 by /SUBSYSTEM:MMOSA flag
# MMOSA refers to Native Win32E (embedded) API, mentioned at:
# https://www.microsoft.com/en-us/research/wp-content/uploads/2016/02/tr-97-18.doc
#>>(0x3c.l+92) leshort 8 for Win9x/MMOSA
# GRR: No examples found by Joerg Jenderek
# 9~IMAGE_SUBSYSTEM_WINDOWS_CE_GUI Windows CE
>>(0x3c.l+92) leshort 9
# WINE https://www.winehq.org/
>>>0x40 string Wine\ placeholder\ DLL for WINE stub
>>>0x40 string Wine\ builtin\ DLL for WINE
>>>0 default x for MS Windows CE
>>>>(0x3c.l+72) leshort x %u
>>>>(0x3c.l+74) leshort x \b.%02u
>>>(0x3c.l+22) leshort&0x2000 >0 (DLL)
# like: MCS9900Ce50.dll Mosiisr99x.dll TMCGPS.DLL
!:ext dll
>>>(0x3c.l+22) leshort&0x2000 0 (EXE)
# like: NNGStart.exe navigator.exe
!:ext exe
# 10~IMAGE_SUBSYSTEM_EFI_APPLICATION An Extensible Firmware Interface (EFI) application
>>(0x3c.l+92) leshort 10 for EFI (application)
# like: bootmgfw.efi grub.efi gdisk_x64.efi Shell_Full.efi shim.efi syslinux.efi
!:ext efi
# 11~IMAGE_SUBSYSTEM_EFI_BOOT_SERVICE_DRIVER An EFI driver with boot services
>>(0x3c.l+92) leshort 11 for EFI (boot service driver)
# like: ext2_x64_signed.efi Fat_x64.efi iso9660_x64_signed.efi
!:ext efi
# 12~IMAGE_SUBSYSTEM_EFI_RUNTIME_DRIVER An EFI driver with run-time services
>>(0x3c.l+92) leshort 12 for EFI (runtime driver)
# no sample found
!:ext efi
# 13~IMAGE_SUBSYSTEM_EFI_ROM An EFI ROM image
>>(0x3c.l+92) leshort 13 for EFI (ROM)
# no sample found
!:ext efi
# 14~IMAGE_SUBSYSTEM_XBOX XBOX
>>(0x3c.l+92) leshort 14 for XBOX
#!:ext foo-xbox
# NO Windows Subsystem number 15!
#>>(0x3c.l+92) leshort 15 for Unknown subsystem 15
# 16~IMAGE_SUBSYSTEM_WINDOWS_BOOT_APPLICATION Windows boot application
>>(0x3c.l+92) leshort 16 for MS Windows
>>>(0x3c.l+72) leshort x %u
>>>(0x3c.l+74) leshort x \b.%02u
>>>(0x3c.l+22) leshort&0x2000 >0 (boot DLL)
# like: bootvhd.dll bootuwf.dll hvloader.dll tcbloader.dll bootspaces.dll
!:ext dll
>>>(0x3c.l+22) leshort&0x2000 0 (boot application)
# like: bootmgr.efi memtest.efi shellx64.efi memtest.exe winload.exe winresume.exe bootvhd.dll hvloader.dll
!:ext efi/exe
>>(0x3c.l+92) default x
>>>&0 leshort x for Unknown subsystem %#x
## End of the subsystem switch
>>(0x3c.l+4) clear x \b,
>>(0x3c.l+4) use display-coff-processor
>>(0x3c.l+22) leshort&0x0200 >0 (stripped to external PDB)
>>(0x3c.l+22) leshort&0x1000 >0 system file
# Check for presence of COM Runtime descriptor
>>(0x3c.l+24) leshort 0x010b
>>>(0x3c.l+116) leshort >14
>>>>(0x3c.l+232) lelong >0 Mono/.Net assembly
>>(0x3c.l+24) leshort 0x020b
>>>(0x3c.l+132) leshort >14
>>>>(0x3c.l+248) lelong >0 Mono/.Net assembly
# hooray, there's a DOS extender using the PE format, with a valid PE
# executable inside (which just prints a message and exits if run in win)
# FIXME: Find sample of such executable for investigation. It was introduced
# in file version 4.14 with the following check:
# "(8.s*16) string 32STUB for MS-DOS, 32rtm DOS extender"
# "(8.s*16) string !32STUB for MS Windows"
# But that check is too generic and had a lot of false positives. 32STUB/32rtm
# sounds like Borland DOS extender with PE loader and Windows emulation which
# can be injected into any valid Windows PE binary.
# So a sample of such an executable needs to be examined, checking its
# subsystem or cpu/machine.
# Detect embedded DOS extenders
>>(8.s*16) string 32STUB
# BRC32.EXE, TLINK32.EXE or TASM32.EXE from TASM 5.0
>>>(8.s*16) search/0x50 32rtm-stub\ for\ PE\ files \b, Borland 32rtm DOS extender (stub)
# CL.EXE or LINK.EXE from MS Visual C++ 1.x
>>(8.s*16) search/0x50 Phar\ Lap\ Software,\ Inc. \b, Phar Lap TNT DOS extender
# ulink.exe
>>(8.s*16) search/0x200 Can't\ find\ DOSWIN32.RTM \b, DosWin32 DOS extender (stub)
>>(8.s*16) search/0x4000 Stub\ failed\ to\ find\ DOS/4G\ extender. \b, DOS/4G DOS extender (stub)
# LOADPEX.BIN and HDLD32.BIN
# x86 jmp near relative (0xe9 0x?? 0x??) + string "MI" (0x4d 0x49)
>>(8.s*16) ulequad&0xffff0000ff =0x494d0000e9 \b, HX DOS extender (embedded with DPMI host)
>>(8.s*16) ulequad&0xffff0000ff !0x494d0000e9
# DPMIST32.BIN
>>>(8.s*16) search/0x200 cannot\ find\ loader\ DPMILD32.EXE \b, HX DOS extender (stub)
# LOADPE.BIN
>>>(8.s*16) search/0x600 PATH=HDPMI32.EXE \b, HX DOS extender (embedded without DPMI host)
# DPMILD32.BIN
>>>(8.s*16) search/0x4000 DPMILD32: \b, HX DOS extender (embedded without DPMI host)
>>(0x3c.l+0xf8) string UPX0 \b, UPX compressed
>>(0x3c.l+0xf8) search/0x140 PEC2 \b, PECompact2 compressed
>>(0x3c.l+0xf8) search/0x140 UPX2
>>>(&0x10.l+(-4)) string PK\3\4 \b, ZIP self-extracting archive (Info-Zip)
>>(0x3c.l+0xf8) search/0x140 .idata
>>>(&0xe.l+(-4)) string PK\3\4 \b, ZIP self-extracting archive (Info-Zip)
>>>(&0xe.l+(-4)) string ZZ0 \b, ZZip self-extracting archive
>>>(&0xe.l+(-4)) string ZZ1 \b, ZZip self-extracting archive
>>(0x3c.l+0xf8) search/0x140 .rsrc
>>>(&0x0f.l+(-4)) string a\\\4\5 \b, WinHKI self-extracting archive
>>>(&0x0f.l+(-4)) string Rar! \b, RAR self-extracting archive
>>>(&0x0f.l+(-4)) search/0x3000 MSCF \b, InstallShield self-extracting archive
>>>(&0x0f.l+(-4)) search/32 Nullsoft \b, Nullsoft Installer self-extracting archive
>>(0x3c.l+0xf8) search/0x140 .data
>>>(&0x0f.l) string WEXTRACT \b, MS CAB-Installer self-extracting archive
>>(0x3c.l+0xf8) search/0x140 .petite\0 \b, Petite compressed
>>>(0x3c.l+0xf7) byte x
>>>>(&0x104.l+(-4)) string =!sfx! \b, ACE self-extracting archive
>>(0x3c.l+0xf8) search/0x140 .WISE \b, WISE installer self-extracting archive
>>(0x3c.l+0xf8) search/0x140 .dz\0\0\0 \b, Dzip self-extracting archive
>>&(0x3c.l+0xf8) search/0x100 _winzip_ \b, ZIP self-extracting archive (WinZip)
>>&(0x3c.l+0xf8) search/0x100 SharedD \b, Microsoft Installer self-extracting archive
>>0x30 string Inno \b, InnoSetup self-extracting archive
# NumberOfSections; Normal Dynamic Link libraries have a few sections for code, data and resource etc.
# PEs used as containers have fewer sections
>>(0x3c.l+6) leshort >1 \b, %u sections
# do not display for 1 section to get output like in version 5.43 and to keep output columns low
#>>(0x3c.l+6) leshort =1 \b, %u section
# If the relocation table is 0x40 or more bytes into the file, it's definitely
# not a DOS EXE.
>0x18 uleshort >0x3f
# Hmm, not a PE but the relocation table is too high for a traditional DOS exe,
# must be one of the unusual subformats.
>>(0x3c.l) string !PE\0\0 MS-DOS executable
#!:mime application/x-dosexec
>>(0x3c.l) string NE \b, NE
#!:mime application/x-dosexec
!:mime application/x-ms-ne-executable
>>>(0x3c.l+0x02) ubyte x \b version %u
>>>(0x3c.l+0x02) ubyte >5
>>>>(0x3c.l+0x03) ubyte x \b.%02u
# FOR DEBUGGING!
# Reference: https://wiki.osdev.org/NE
# Create time for NE version <5 in FAT12 format
#>>>(0x3c.l+0x02) ubyte <5
#>>>>(0x3c.l+0x08) ulelong !0 \b, Created at
#>>>>>(0x3c.l+0x0a) lemsdosdate x %s
#>>>>>(0x3c.l+0x08) lemsdostime x %s
# ProgFlags; Program flags, bitmapped
#>>>(0x3c.l+0x0C) ubyte x \b, ProgFlags 0x%2.2x
# >>>(0x3c.l+0x0c) ubyte&0x03 =0 \b, no automatic data segment
# >>>(0x3c.l+0x0c) ubyte&0x03 =1 \b, single shared
# >>>(0x3c.l+0x0c) ubyte&0x03 =2 \b, multiple
# >>>(0x3c.l+0x0c) ubyte&0x03 =3 \b, (null)
# >>>(0x3c.l+0x0c) ubyte &0x04 \b, Per-Process Library Initialization OR real mode only
# >>>(0x3c.l+0x0c) ubyte &0x08 \b, Protected mode only
# >>>(0x3c.l+0x0c) ubyte &0x10 \b, 8086 instructions in OS/2 app OR LIM 3.2 EMS API in Win app
# >>>(0x3c.l+0x0c) ubyte &0x20 \b, i286 instructions in OS/2 app OR each instance in separate EMS bank in Win app
# >>>(0x3c.l+0x0c) ubyte &0x40 \b, i386 instructions in OS/2 app OR private GlobalAlloc above the EMS line in Win app
# >>>(0x3c.l+0x0c) ubyte &0x80 \b, x87 floating point instructions
# ApplFlags; Application flags, bitmapped
# https://www.fileformat.info/format/exe/corion-ne.htm
#>>>(0x3c.l+0x0D) ubyte x \b, ApplFlags 0x%2.2x
# Application type (bits 0-2); 1~Full screen (not aware of Windows/P.M. API)
# 2~Compatible with Windows/P.M. API 3~Uses Windows/P.M. API
#>>>(0x3c.l+0x0D) ubyte&0x07 =1 \b, Not compatible with Windows/P.M. API (full screen)
#>>>(0x3c.l+0x0D) ubyte&0x07 =2 \b, Compatible with Windows/P.M. API (console mode)
#>>>(0x3c.l+0x0D) ubyte&0x07 =3 \b, use Windows/P.M. API (window mode)
#>>>(0x3c.l+0x0D) ubyte &0x08 \b, Bound OS/2 app OR application specific loader in Win app
#>>>(0x3c.l+0x0D) ubyte &0x20 \b, Errors in image
#>>>(0x3c.l+0x0D) ubyte &0x40 \b, Non-conforming OS/2 app OR private Win library above EMS line
# bit 7; DLL or driver (SS:SP info invalid, CS:IP points at FAR init routine called with AX handle)
#>>>(0x3c.l+0x0D) ubyte &0x80 \b, DLL or driver
# AutoDataSegIndex; automatic data segment index like: 0 2 3 22
# zero if the SINGLEDATA and MULTIPLEDATA bits are cleared
#>>>(0x3c.l+0x0e) uleshort x \b, AutoDataSegIndex %u
# InitHeapSize; initial local heap size like: 0 400h 1400h
# zero if there is no local allocation
#>>>(0x3c.l+0x10) uleshort !0 \b, InitHeapSize 0x%x
# InitStackSize; initial stack size like: 0 10h A00h 7D0h A8Ch FA0h 1000h 1388h
# 1400h (CBT) 1800h 2000h 2800h 2EE0h 2F3Ch 3258h 3E80h 4000h 4E20h 5000h 6000h
# 6D60h 8000h 40000h
# zero if the SS register value does not equal the DS register value
#>>>(0x3c.l+0x12) uleshort !0 \b, InitStackSize 0x%x
# EntryPoint; segment offset value of CS:IP like: 0 10000h 18A84h 11C1Ah 307F1h
#>>>(0x3c.l+0x14) ulelong !0 \b, EntryPoint 0x%x
# InitStack; specifies the segment offset value of stack pointer SS:SP
# like: 0 20000h 160000h
#>>>(0x3c.l+0x18) ulelong !0 \b, InitStack 0x%x
# SegCount; number of segments in segment table like: 0 1 2 3 16h
#>>>(0x3c.l+0x1C) uleshort x \b, SegCount 0x%x
# ModRefs; number of module references (DLLs) like: 0 1 3
#>>>(0x3c.l+0x1E) uleshort !0 \b, ModRefs %u
# NoResNamesTabSiz; size in bytes of non-resident names table
# like: Bh 16h B4h B9h 2Ch 18Fh 16AAh
#>>>(0x3c.l+0x20) uleshort x \b, NoResNamesTabSiz 0x%x
# SegTableOffset; offset of Segment table like: 40h
#>>>(0x3c.l+0x22) uleshort !0x40 \b, SegTableOffset 0x%x
# ResTableOffset; offset of resources table like: 40h 50h 58h F0h
# 40h for most fonts like dos737.fon FMFONT.FOT but 60h for L1WBASE.FON
#>>>(0x3c.l+0x24) uleshort x \b, ResTableOffset 0x%x
# ResidNamTable; offset of resident names table
# like: 58h 5Ch 60h 68h 74h 98h 2E3h 2E7h 2F0h
#>>>(0x3c.l+0x26) uleshort x \b, ResidNamTable 0x%x
# ImportNameTable; offset of imported names table (array of counted strings, terminated with string of length 00h)
# like: 77h 7Eh 80h C6h A7h ACh 2F8h 3FFh
#>>>(0x3c.l+0x2a) uleshort x \b, ImportNameTable 0x%x
# OffStartNonResTab; offset from start of file to non-resident names table
# like: 110h 11Dh 19Bh 1A5h 3F5h 4C8h 4EEh D93h
#>>>(0x3c.l+0x2c) ulelong x \b, OffStartNonResTab 0x%x
# MovEntryCount; number of movable entry points like: 0 4 5 6 16 17 24 312 355 446
#>>>(0x3c.l+0x30) uleshort !0 \b, MovEntryCount %u
# FileAlnSzShftCnt; log2 of the segment sector size; 4~16 0~9~512 (default)
#>>>(0x3c.l+0x32) uleshort !9 \b, FileAlnSzShftCnt %u
# nResTabEntries; number of resource table entries like: 0 2
#>>>(0x3c.l+0x34) uleshort !0 \b, nResTabEntries %u
# Following fields are valid only for NE version 5+
>>>(0x3c.l+0x02) ubyte >4
# targOS; Target OS; 0~unspecified (OS/2 or Windows); detect it based on Windows-only flags and OS/2 specific import lib (DOSCALLS)
#>>>(0x3c.l+0x36) byte x TARGOS %x
>>>>(0x3c.l+0x36) byte 0
# if windows version is specified then it is windows binary
>>>>>(0x3c.l+0x3E) ushort !0 for MS Windows
>>>>>>(0x3c.l+0x3F) ubyte x %u
>>>>>>(0x3c.l+0x3E) ubyte x \b.%02u
>>>>>>(0x3c.l+0x3F) ubyte <3
>>>>>>>(0x3c.l+0x37) byte&0x04 0 (real mode only)
>>>>>>>(0x3c.l+0x37) byte&0x04 !0 (real+protected mode)
>>>>>>(0x3c.l+0x3E) ushort =0x0300
>>>>>>>(0x3c.l+0x0c) ubyte&0x08 0 (real+protected mode)
>>>>>>>(0x3c.l+0x0c) ubyte&0x08 !0 (protected mode only)
>>>>>(0x3c.l+0x3E) ushort 0
>>>>>>(0x3c.l+0x2a) leshort 0 for OS/2 1.x or MS Windows 1.x/2.x
>>>>>>(0x3c.l+0x2a) default x
# Binaries with DOSCALLS import library are for OS/2
>>>>>>>&(&0.s-0x29) search/512/C \x08DOSCALLS for OS/2 1.x
>>>>>>>(0x3c.l+0x2a) default x
# Binaries with KERNEL, USER or GDI import library are for Windows
# FIXME: each name is prefixed by its length, but regex type does not support binary bytes
>>>>>>>>&(&0.s-0x29) regex/512/C KERNEL|USER|GDI for MS Windows 1.x/2.x
>>>>>>>>>(0x3c.l+0x37) byte&0x04 0 (real mode only)
>>>>>>>>>(0x3c.l+0x37) byte&0x04 !0 (real+protected mode)
# Binaries without any of those import libraries can be for any OS
>>>>>>>>(0x3c.l+0x2a) default x for OS/2 1.x or MS Windows 1.x/2.x
>>>>(0x3c.l+0x36) byte 1 for OS/2 1.x
>>>>(0x3c.l+0x36) byte 2 for MS Windows
# expctwinver; expected Windows version (minor first) like:
# 0.0~DTM.DLL 203.4~Windows 1.03 GDI.EXE 2.1~TTY.DRV 3.0~dos737.fon FMFONT.FOT THREED.VBX 3.10~GDI.EXE 4.0~(ME) VGAFULL.3GR
>>>>>(0x3c.l+0x3E) ushort !0
>>>>>>(0x3c.l+0x3F) ubyte x %u
>>>>>>(0x3c.l+0x3E) ubyte x \b.%02u
# Empty version is treated by Windows 3.x OS as Windows 2.01 version and by Windows 2.x OS as Windows 1.01 version
>>>>>(0x3c.l+0x3E) ushort 0 1.x/2.x
>>>>>(0x3c.l+0x3F) ubyte <3
>>>>>>(0x3c.l+0x37) byte&0x04 0 (real mode only)
>>>>>>(0x3c.l+0x37) byte&0x04 !0 (real+protected mode)
>>>>>(0x3c.l+0x3E) ushort =0x0300
>>>>>>(0x3c.l+0x0c) ubyte&0x08 0 (real+protected mode)
>>>>>>(0x3c.l+0x0c) ubyte&0x08 !0 (protected mode only)
# Windows P-code application
# https://web.archive.org/web/20000304044656/http://msdn.microsoft.com/library/backgrnd/html/msdn_c7pcode2.htm
# https://library.thedatadungeon.com/msdn-1992-09/msjv7/html/msjv0g6a.content.htm
# https://en.wikipedia.org/wiki/P-code_machine#Microsoft_P-code
# Can be created by MSC7 or MSVC1.x CL.EXE /Oq switch which calls MPC.EXE
# MPC.EXE (Make P-Code utility) sets bit2 in MZ e_res[2] (e_flags) field
# Filter out false-positive Windows 3.x applications with OS/2 WLO loader
# (sets bit7 in NE ne_flagsothers) as they do not have MZ e_res[] fields
>>>>>(0x3c.l+0x3E) ushort >0x0300
>>>>>>(0x3c.l+0x37) ubyte&0x80 0
>>>>>>>0x20 ubyte&0x04 !0 \b, P-code application
# 32-bit Watcom Win386 extender in 16-bit Windows 3.x NE binaries
# https://www.os2museum.com/wp/watcom-win386/
# https://github.com/open-watcom/open-watcom-v2/blob/master/bld/win386/
# https://misc.daniel-marschall.de/spiele/blown_away/disassemble.php
# Examples: BA_LITE.EXE WALDO.EXE
>>>>>(0x3c.l+0x3E) ushort >0x0300
>>>>>>0x38 ulong !0
>>>>>>>(0x38.l) string MQ \b, Watcom Win386 extender
# OS 3 was reserved for Multitasking MS-DOS but it never used NE version 5+ (only NE version 4)
#>>>>(0x3c.l+0x36) byte 3 for Multitasking MS-DOS
# OS 4 was reserved for MS Windows/386 device drivers but MS Windows/386 2.x never used NE format (Xenix x.out format was used instead)
#>>>>(0x3c.l+0x36) byte 4 for MS Windows/386 device driver
# OS 5 is assigned to BOSS (Borland Operating System Services) but is used also by other 16-bit DOS applications
>>>>(0x3c.l+0x36) byte 5 for MS-DOS
# HDLD16.BIN
# x86 jmp near relative (0xe9 0x?? 0x??) + string "MI" (0x4d 0x49)
>>>>>(8.s*16) ulequad&0xffff0000ff =0x494d0000e9 \b, HX DOS extender 16-bit (embedded with DPMI host)
>>>>>(8.s*16) ulequad&0xffff0000ff !0x494d0000e9
# DPMIST16.BIN
>>>>>>(8.s*16) search/0x200 cannot\ find\ loader\ DPMILD16.EXE \b, HX DOS extender 16-bit (stub)
# DPMILD16.BIN
>>>>>>(8.s*16) search/0x4000 DPMILD16: \b, HX DOS extender 16-bit (embedded without DPMI host)
# TLINK.EXE or TD.EXE from TASM 5.0
>>>>>>(8.s*16) string 16STUB
>>>>>>>(8.s*16) search/0x1000 rtm.exe\0dpmi16bi.ovl \b, Borland rtm DOS extender (stub)
>>>>>>(8.s*16) string !16STUB
# TLINK.EXE or BRC.EXE from Borland Pascal 7.0
>>>>>>>(8.s*16) search/0x1000 BOSS\ Stub\ Version \b, Borland BOSS DOS extender (stub)
# OS 6 is not assigned but is used by 32-bit DOS application with extender (found only with HX DOS extender 32-bit)
# http://downloads.sourceforge.net/dfendreloaded/D-Fend-Reloaded-1.4.4.zip
# D-Fend Reloaded/VirtualHD/FREEDOS/DPMILD32.EXE
# https://www.japheth.de/HX/DPMILD32.TXT
>>>>(0x3c.l+0x36) byte 6 for MS-DOS
# HDLD32.BIN
# x86 jmp near relative (0xe9 0x?? 0x??) + string "MI" (0x4d 0x49)
>>>>>(8.s*16) ulequad&0xffff0000ff =0x494d0000e9 \b, HX DOS extender 32-bit (embedded with DPMI host)
>>>>>(8.s*16) ulequad&0xffff0000ff !0x494d0000e9
# DPMIST32.BIN
>>>>>>(8.s*16) search/0x200 cannot\ find\ loader\ DPMILD32.EXE \b, HX DOS extender 32-bit (stub)
# DPMILD32.BIN
>>>>>>(8.s*16) search/0x4000 DPMILD32: \b, HX DOS extender 32-bit (embedded without DPMI host)
# https://en.wikipedia.org/wiki/Phar_Lap_(company)
# like: TELLPROT.EXE from 286DEX
# can be created by BIND286.EXE from OS/2 NE binary
>>>>(0x3c.l+0x36) byte 0x81 for MS-DOS, Phar Lap 286 DOS extender, emulating OS/2 1.x
# like: CVP7.EXE from 286DEX
# can be created by BIND286.EXE from Windows NE binary
>>>>(0x3c.l+0x36) byte 0x82 for MS-DOS, Phar Lap 286 DOS extender, emulating MS Windows
>>>>>(0x3c.l+0x3E) ushort 0 1.x/2.x
>>>>>(0x3c.l+0x3E) ushort !0
>>>>>>(0x3c.l+0x3F) ubyte x %u
>>>>>>(0x3c.l+0x3E) ubyte x \b.%02u
>>>>(0x3c.l+0x36) default x
>>>>>(0x3c.l+0x36) ubyte x for unknown OS %#x
# OS2EXEFlags; other EXE flags
# 1~Long filename support 2~Win2.x proportional fonts 4~Win2.x protected mode 8~Executable has gangload area 10~Win9x thunk lib without DllEntryPoint 80~Win3.x app with OS/2 WLO loader
#>>>>(0x3c.l+0x37) byte !0 \b, OS2EXEFlags 0x%x
# gangstart; offset to start of gangload area like: 0 34h 58h 246h
#>>>>(0x3c.l+0x38) uleshort !0 \b, gangstart 0x%x
# ganglength; size of gangload area
# like: 0 33Eh 39Ah AEEh
#>>>>(0x3c.l+0x3A) uleshort !0 \b, ganglength 0x%x
# mincodeswap; minimum code swap area size like 0 620Ch
#>>>>(0x3c.l+0x3C) uleshort !0 \b, mincodeswap 0x%x
>>>>(0x3c.l+0x3F) ubyte =3
>>>>>0x3c ulelong >0x800
>>>>>>(0x3c.l+0x37) ubyte &0x80 with OS/2 WLO loader
# Detection for NE versions <5 which do not have OS type byte 0x36
# These versions are used only by WINE, Windows 1.x/2.x and Multitasking MS-DOS
# WINE binaries have special signature after the dos header (at fixed offset 0x40)
# Multitasking MS-DOS binaries import the DOSCALLS library, so use it for distinguishing
# Import libraries are part of the string table which starts one byte after the
# 16-bit indirect offset 0x2a relative to the beginning of NE header, and consist
# of concatenated pascal strings (first byte of the string is its length)
>>>(0x3c.l+0x02) ubyte <5
# like: fakedlls/krnl386.exe16 fakedlls/gdi.exe16 fakedlls/winsock.dll16 fakedlls/winoldap.mod16 fakedlls/mouse.drv16
>>>>0x40 string Wine\ placeholder\ DLL for WINE stub
>>>>(0x3c.l+0x2a) default x
# like: HE_DAEM.EXE POPUP.EXE QUEUER.EXE
>>>>>&(&0.s-0x29) search/512/C \x08DOSCALLS for Multitasking MS-DOS
>>>>>(0x3c.l+0x2a) default x for MS Windows 1.x/2.x
# Special case: Windows 3.x OS also parses the following NE version 5 fields from NE version 4 binaries:
# - OS type, if it is 0 or 2
# - the proportional fonts and protected mode bits
# Such NE version 4 binary is treated by Windows 3.x OS as Windows 2.01
# compatible binary and by Windows 2.x OS as Windows 1.01 compatible binary.
# So if os type is correct (0 or 2; matched mask 0xfd) and at least one
# of those bits is set and others are cleared (matched mask 0xf9) then
# detect if binary has NE version 5 protected mode bit set.
>>>>>>(0x3c.l+0x36) leshort&0xf9fd 0
>>>>>>>(0x3c.l+0x37) byte&0x06 !0
>>>>>>>>(0x3c.l+0x37) byte&0x04 0 (real mode only)
>>>>>>>>(0x3c.l+0x37) byte&0x04 !0 (real+protected mode)
>>>>>>>(0x3c.l+0x37) default x (real mode only)
>>>>>>(0x3c.l+0x36) default x (real mode only)
# DRV: Driver
# 3GR: Grabber device driver
# CPL: Control Panel Item
# VBX: Visual Basic Extension https://en.wikipedia.org/wiki/Visual_Basic
# FON: Bitmap font http://fileformats.archiveteam.org/wiki/FON
# FOT: Font resource file
# EXE: WINSPOOL.EXE USER.EXE krnl386.exe GDI.EXE
# CNV: Microsoft Word text conversion https://www.file-extensions.org/cnv-file-extension-microsoft-word-text-conversion-data
>>>(0x3c.l+0x0c) leshort &0x8000
# Check segment count, if 0 then this is resource-only DLL
>>>>(0x3c.l+0x1c) leshort 0
>>>>>(0x3c.l+0x2c) lelong !0
>>>>>>(&-4.l+1) string/C FONTRES (DLL, font)
!:ext fon/fot
>>>>>>(&-4.l+1) default x (DLL, resource-only)
!:ext dll
>>>>>(0x3c.l+0x2c) lelong 0 (DLL, resource-only)
!:ext dll
>>>>(0x3c.l+0x1c) leshort !0
# Check description of the module, first word specifies type of the DLL library
>>>>>(0x3c.l+0x2c) lelong !0
>>>>>>(&-4.l+1) string/C DDRV (DLL, driver)
!:ext drv
>>>>>>(&-4.l+1) default x (DLL)
!:ext dll/drv/3gr/cpl/vbx
>>>>>(0x3c.l+0x2c) lelong 0 (DLL)
!:ext dll/drv/3gr/cpl/vbx
>>>(0x3c.l+0x0c) leshort&0x8000 0 (EXE)
!:ext exe/scr
>>>>(0x3c.l+0x0d) ubyte&0x07 =1 (full screen)
>>>>(0x3c.l+0x0d) ubyte&0x07 =2 (console)
>>>>(0x3c.l+0x0d) ubyte&0x07 =3 (GUI)
>>>&(&0x24.s-1) string ARJSFX \b, ARJ self-extracting archive
>>>(0x3c.l+0x70) search/0x80 WinZip(R)\ Self-Extractor \b, ZIP self-extracting archive (WinZip)
>>(0x3c.l) string LX \b, LX
!:mime application/x-dosexec
>>>(0x3c.l+0x2) uleshort =0x0000
>>>>(0x3c.l) use lx-executable
# no examples found for big endian variant
>>>(0x3c.l+0x2) uleshort =0x0101
>>>>(0x3c.l) use \^lx-executable
# no examples found for PDP-11 endian variant
>>>(0x3c.l+0x2) uleshort =0x0100
# PDP-11-endian is not supported by magic "use" keyword yet
# no examples found for other endian variants
>>>0 default x
# other endianness is not supported by magic "use" keyword
>>>(8.s*16) string emx \b, emx
>>>>&1 string x %s
>>>&(&0x54.l-3) string arjsfx \b, ARJ self-extracting archive
# MS Windows system file, supposedly a collection of LE executables
# like vmm32.vxd WIN386.EXE
>>(0x3c.l) string W3 \b, W3 for MS Windows
#!:mime application/x-dosexec
!:mime application/x-ms-w3-executable
>>>(0x3c.l+0x3) ubyte <4 %u
# Windows 3.x WIN386.EXE
!:ext exe
>>>(0x3c.l+0x3) ubyte >3 %u
# Windows 95 VMM32.VXD
!:ext vxd
>>>(0x3c.l+0x2) ubyte x \b.%02u
# W4 executable
>>(0x3c.l) string W4 \b, W4 for MS Windows
#!:mime application/x-dosexec
!:mime application/x-ms-w4-executable
# windows 98 VMM32.VXD
!:ext vxd
>>>(0x3c.l+0x3) ubyte x %u
>>>(0x3c.l+0x2) ubyte x \b.%02u
# Linear Executable (LE) in Little Endian (\0\0)
>>(0x3c.l) string LE\0\0 \b, LE
!:mime application/x-dosexec
>>>(0x3c.l+0x0a) leshort 1
# some DOS extenders use LE files with OS/2 header
>>>>0x240 search/0x100 DOS/4G for MS-DOS, DOS/4G DOS extender
>>>>0x240 search/0x200 WATCOM\ C/C++ for MS-DOS, DOS/4GW DOS extender
>>>>0x440 search/0x100 CauseWay\ DOS\ Extender for MS-DOS, CauseWay DOS extender
>>>>0x40 search/0x40 PMODE/W for MS-DOS, PMODE/W DOS extender
>>>>0x40 search/0x40 STUB/32A for MS-DOS, DOS/32A DOS extender (stub)
>>>>0x40 search/0x80 STUB/32C for MS-DOS, DOS/32A DOS extender (configurable stub)
>>>>0x40 search/0x80 DOS/32A for MS-DOS, DOS/32A DOS extender (embedded)
# D3XW.EXE
>>>>(8.s*16) string o2LEstub for MS-DOS, D3X DOS extender
>>>>0 default x
# DOS32MW.DLL
>>>>>(0x3c.l+0x10) lelong&0x38000 =0x18000 for MS-DOS (DLL)
!:ext dll
# HPFS.386 (HPFS386 filesystem for OS/2 1.x, part of Microsoft LAN Manager)
# https://www.os2museum.com/wp/os2-history/os2-16-bit-server/
# EXE module (&0x38000=0x00000) with zero application type (&0x700=0x000) and
# with no external fixups (&0x20=0x20) is .386 32-bit driver module for OS/2 1.x
>>>>>(0x3c.l+0x10) lelong&0x38720 =0x00020 for OS/2 1.x (driver)
!:ext 386
>>>>>0 default x for unknown OS 0x1
# this is a wild guess; hopefully it is a specific signature
>>>>&0x24 lelong <0x50
>>>>>(&0x4c.l) string \xfc\xb8WATCOM
>>>>>>&0 search/8 3\xdbf\xb9 \b, 32Lite compressed
# another wild guess: if real OS/2 LE executables exist, they probably have higher start EIP
#>>>>(0x3c.l+0x1c) lelong >0x10000 for OS/2
# fails with DOS-Extenders.
# OS 2 was reserved for MS Windows 16-bit but it never used LE (NE format was used instead)
#>>>(0x3c.l+0x0a) leshort 2 for MS Windows 16-bit
# OS 3 was reserved for Multitasking MS-DOS but it never used LE (NE format was used instead)
#>>>(0x3c.l+0x0a) leshort 3 for Multitasking MS-DOS
>>>(0x3c.l+0x0a) leshort 4 for MS Windows
>>>>(0x3c.l+0xc3) ubyte x %u
>>>>(0x3c.l+0xc2) ubyte x \b.%02u
>>>>(0x3c.l+0x10) lelong&0x38000 =0x08000
# DLL module (0x08000) with no external fixups (0x20) for i386 CPU (2) is .386 VxD file for MS Windows 3.x
>>>>>(0x3c.l+0x10) lelong&0x20 !0
>>>>>>(0x3c.l+0x08) leshort 2 (VxD 386)
!:ext 386
>>>>(0x3c.l+0x10) lelong&0x38000 =0x28000 (VxD static)
# VXD: VxD for MS Windows 95/98/Me
# PDR: Port driver
# MPD: Miniport driver (?)
!:ext vxd/pdr/mpd
>>>>(0x3c.l+0x10) lelong&0x38000 =0x38000 (VxD dynamic)
!:ext vxd/pdr/mpd
>>>(0x3c.l+0x0a) default x
>>>>(0x3c.l+0x0a) leshort x for unknown OS %#x
>>>(&0x7c.l+0x26) string UPX \b, UPX compressed
>>>&(&0x54.l-3) string UNACE \b, ACE self-extracting archive
# DOS/32A Linear Compressed file format
>>(0x3c.l) string LC\0\0 \b, LC for MS-DOS
>>>0x40 search/0x40 STUB/32A \b, DOS/32A DOS extender (stub)
>>>0x40 search/0x80 STUB/32C \b, DOS/32A DOS extender (configurable stub)
>>>0x40 search/0x80 DOS/32A \b, DOS/32A DOS extender (embedded)
# PX\0\0 signature for 32bit DOS Applications in DOS-PE Format (https://www.japheth.de/HX.html)
# SHDPMI.EXE, DOSTEST.EXE, GETVMODE.EXE, RMINT.EXE
>(0x3c.l) string PX\0\0 \b, PE32
>>(0x3c.l+24) leshort 0x020b \b+
>>0 clear x
>>0 default x executable for MS-DOS
# LOADPEX.BIN and HDLD32.BIN
# x86 jmp near relative (0xe9 0x?? 0x??) + string "MI" (0x4d 0x49)
>>(8.s*16) ulequad&0xffff0000ff =0x494d0000e9 \b, HX DOS extender (embedded with DPMI host)
>>(8.s*16) ulequad&0xffff0000ff !0x494d0000e9
# DPMIST32.BIN
>>>(8.s*16) search/0x200 cannot\ find\ loader\ DPMILD32.EXE \b, HX DOS extender (stub)
# LOADPE.BIN
>>>(8.s*16) search/0x600 PATH=HDPMI32.EXE \b, HX DOS extender (embedded without DPMI host)
# DPMILD32.BIN
>>>(8.s*16) search/0x4000 DPMILD32: \b, HX DOS extender (embedded without DPMI host)
>0 clear x
# Skip already parsed binary types
# If magic in the branch is not parsed then always jumps to mz-unrecognized
>(0x3c.l) string PE\0\0
>(0x3c.l) string PX\0\0
>(0x3c.l) string LX
>(0x3c.l) string NE
>>(0x3c.l-0x02) string !IMNE
>>>0x18 uleshort <0x40
>>>>0 use mz-unrecognized
>(0x3c.l) string W3
>>0x18 uleshort <0x40
>>>0 use mz-unrecognized
>(0x3c.l) string W4
>>0x18 uleshort <0x40
>>>0 use mz-unrecognized
>(0x3c.l) string LE\0\0
>>0x18 uleshort <0x40
>>>0 use mz-unrecognized
>(0x3c.l) string LC
>>0x18 uleshort <0x40
>>>0 use mz-unrecognized
>0 default x
# This sequence jumps to the next MZ overlay
>>2 leshort !0
# FIXME: The following line does not match binaries whose total size is less than (4.s*512)
>>>(4.s*512) leshort x
>>>>&(2.s-514) leshort x
>>>>>&-2 use mz-next-overlay
>>>>>&-2 string BW
>>>>>>0 use mz-bw-collection
>>>>>&-2 string 3P
>>>>>>0 use mz-3p
>>>>0 default x
>>>>>0 use mz-unrecognized
>>>0 default x
>>>>0 use mz-unrecognized
>>2 leshort 0
>>>(4.s*512) leshort x
>>>>&-2 use mz-next-overlay
>>>>&-2 string BW
>>>>>0 use mz-bw-collection
>>>>&-2 string 3P
>>>>>0 use mz-3p
>>>0 default x
>>>>0 use mz-unrecognized
# Parse content of the COFF, executable type was already printed in mz-next-overlay
>(4.s*512) leshort 0x014c
#!:mime application/x-dosexec
# djgpp go32 v1 COFF
# F2C.EXE from f2c95201.zip or compress.exe from djdev112.zip
>>(&-6.l) string/b StubInfoMagic!!\0 for MS-DOS
# djgpp go32 v2 COFF
>>(8.s*16) string go32stub for MS-DOS
>>(8.s*16) string emx
>>>&1 string x for DOS, Win or OS/2, emx %s
>>&(&0x42.l-3) byte x
>>>&0x26 string UPX \b, UPX compressed
# and yet another guess: small .text, and after large .data is unusual, could be 32lite
>>&0x2c search/0xa0 .text
>>>&0x0b lelong <0x2000
>>>>&0 lelong >0x6000 \b, 32lite compressed
# Parse content of the a.out, executable type was already printed in mz-next-overlay
>(4.s*512) leshort 0x010b
# djgpp go32 v1 a.out
>>(&-6.l) string/b StubInfoMagic!!\0 for MS-DOS
# djgpp go32 v1
# Note that for "redirect" binaries the offset (4.s*512) is beyond end-of-file, so access it via "default"
>(4.s*512) clear x
>(4.s*512) default x
>>(&-4.l) string/b StubInfoMagic!!\0
>>>&0 lelong >39
>>>>&19 byte x \b, DJGPP go32 v%u
>>>>&18 byte x \b.%u
>>>>&17 byte x \b%c DOS extender (stub)
>>>&0 lelong <40 \b, DJGPP go32 v1 DOS extender (stub)
>>>&0 lelong >35
>>>>&0 byte !0
>>>>>&-1 string/16 x \b, autoload "%s"
>>>&0 lelong >62
>>>>&28 byte !0
# zcat.exe from djdev112.zip
>>>>>&-1 string/15 x \b, redirect to "%s"
# djgpp go32 v2
>(8.s*16) string go32stub
# Version string is usually ", v 2.05", so skip leading spaces
>>&0 string ,\ v\
>>>&0 string/4 x \b, DJGPP go32 v%s DOS extender
>>&0 default x
>>>&0 string/8 x \b, DJGPP go32 %s DOS extender
>>&8 lelong >43
>>>&24 byte 0
# check for embedded DPMI host PMODSTUB.EXE
>>>>0x1c string PMODSTUB.EXE (embedded PMODE/DJ)
>>>>0x1c string !PMODSTUB.EXE
>>>>>0x18 leshort 0
# check for the default djgpp stub
>>>>>>0x40 search/0x80 The\ STUB.EXE\ stub\ loader (stub)
>>>>>>>(8.s*16) default x
>>>>>>>>&8 lelong >83
>>>>>>>>>&56 byte !0
# show which DPMI host executable is autoloaded when none is running
>>>>>>>>>>&-1 string/16 x \b, autoload "%s"
>>>>>(0x18.s) default x
>>>>>>&(0x6.s*4) default x
# check for embedded DPMI host CWSDSTUB.EXE
>>>>>>>&0 search/16 CWSDPMI
>>>>>>>>&-7 regex/T =^CWSDPMI(\ [^\ ]+\ )? (embedded %s)
# check for embedded DPMI host D3XD.EXE
>>>>>>>&0 search/16 D3X
>>>>>>>>&-3 regex/T =^D3X(\ [^\ ]+\ )? (embedded %s)
>>>&24 byte !0
# djtarx.exe or dxegen.exe from djdev205.zip
>>>>&-1 string/8 x \b, redirect to "%s"
>(8.s*16) string $WdX \b, WDos/X DOS extender
# By now an executable type should have been printed out. The executable
# may be a self-uncompressing archive, so look for evidence of that and
# print it out.
#
# Some signatures below from Greg Roelofs, newt@uchicago.edu.
#
>0x35 string \x8e\xc0\xb9\x08\x00\xf3\xa5\x4a\x75\xeb\x8e\xc3\x8e\xd8\x33\xff\xbe\x30\x00\x05 \b, aPack compressed
>0xe7 string LH/2\ Self-Extract \b, %s
>0x1c string UC2X \b, UCEXE compressed
>0x1c string WWP\ \b, WWPACK compressed
>0x1c string RJSX \b, ARJ self-extracting archive
>0x1c string diet \b, diet compressed
>0x1c string LZ09 \b, LZEXE v0.90 compressed
>0x1c string LZ91 \b, LZEXE v0.91 compressed
>0x1c string tz \b, TinyProg compressed
>0x1e string Copyright\ 1989-1990\ PKWARE\ Inc. \b, Self-extracting PKZIP archive
!:mime application/zip
# Yes, this really is "Copr", not "Corp."
>0x1e string PKLITE\ Copr. \b, Self-extracting PKZIP archive
!:mime application/zip
# winarj stores a message in the stub instead of the sig in the MZ header
>0x20 search/0xe0 aRJsfX \b, ARJ self-extracting archive
>0x20 string AIN
>>0x23 string 2 \b, AIN 2.x compressed
>>0x23 string <2 \b, AIN 1.x compressed
>>0x23 string >2 \b, AIN 1.x compressed
>0x24 string LHa's\ SFX \b, LHa self-extracting archive
!:mime application/x-lha
>0x24 string LHA's\ SFX \b, LHa self-extracting archive
!:mime application/x-lha
>0x24 string \ $ARX \b, ARX self-extracting archive
>0x24 string \ $LHarc \b, LHarc self-extracting archive
>0x20 string SFX\ by\ LARC \b, LARC self-extracting archive
>0x40 string aPKG \b, aPackage self-extracting archive
>0x64 string W\ Collis\0\0 \b, Compack compressed
>0x7a string Windows\ self-extracting\ ZIP \b, ZIP self-extracting archive
>>&0xf4 search/0x140 \x0\x40\x1\x0
>>>(&0.l+(4)) string MSCF \b, WinHKI CAB self-extracting archive
>1638 string -lh5- \b, LHa self-extracting archive v2.13S
>0x17888 string Rar! \b, RAR self-extracting archive
# Skip to the end of the EXE. This will usually work fine in the PE case
# because the MZ image is hardcoded into the toolchain and almost certainly
# won't match any of these signatures.
>(4.s*512) long x
>>&(2.s-517) byte x
>>>&0 string PK\3\4 \b, ZIP self-extracting archive
>>>&0 string Rar! \b, RAR self-extracting archive
>>>&0 string =!\x11 \b, AIN 2.x self-extracting archive
>>>&0 string =!\x12 \b, AIN 2.x self-extracting archive
>>>&0 string =!\x17 \b, AIN 1.x self-extracting archive
>>>&0 string =!\x18 \b, AIN 1.x self-extracting archive
>>>&7 search/400 **ACE** \b, ACE self-extracting archive
>>>&0 search/0x480 UC2SFX\ Header \b, UC2 self-extracting archive
# a few unknown ZIP sfxes, no idea if they are needed or if they are
# already captured by the generic patterns above
>(8.s*16) search/0x20 PKSFX \b, ZIP self-extracting archive (PKZIP)
# TODO: how to add this? >FileSize-34 string Windows\ Self-Installing\ Executable \b, ZIP self-extracting archive
#
# TELVOX Teleinformatica CODEC self-extractor for OS/2:
>49801 string \x79\xff\x80\xff\x76\xff \b, CODEC archive v3.21
>>49824 leshort =1 \b, 1 file
>>49824 leshort >1 \b, %u files
# This named instance is called for multi overlay MZ executable with offset of the next overlay
# It inspects the signature found at that offset. Known signatures are reported
# directly; anything else falls through to the "default" branch at the end, which
# rounds the offset up to a multiple of 0x10 and retries via mz-next-overlay-aligned.
0 name mz-next-overlay
>0 string P2 \b, EXP (P2) for MS-DOS, Phar Lap 286 DOS extender
>0 string P3 \b, EXP (P3) for MS-DOS, Phar Lap 386 DOS extender
>0 string MT \b, MT for MS-DOS, IGC XMLOD i386 DOS extender
>0 string 3P \b, 3P for MS-DOS
# Other 3P details are printed later as they depend on the original MZ content
# The 32-bit little-endian value at offset 32 is tested as a set of flags:
# bit 0 set selects "16-bit"; with bit 0 clear, bit 16 selects "32-bit" or "Dual mode"
>>32 lelong&0x00000001 !0 \b, 16-bit
>>32 lelong&0x00000001 0
# CWC.EXE from cw349bin.zip is 32-bit
>>>32 lelong&0x00010000 0 \b, 32-bit
# WL32.EXE from cw349bin.zip is dual mode
>>>32 lelong&0x00010000 !0 \b, Dual mode
# bit 31 of the same value selects "Compressed"
>>32 lelong&0x80000000 !0 \b, Compressed
>0 string D3X1 \b, D3X1 for MS-DOS, D3X DOS extender
# BW details are printed later as they depend on the original MZ content
>0 string BW \b, BW collection for MS-DOS
# a.out details are printed later as they depend on the original MZ content
>0 leshort 0x010b \b, a.out
# COFF details are printed later as they depend on the original MZ content
>0 leshort 0x014c \b, COFF
# none of the signatures above matched
>0 default x
# now make offset aligned to 0x10
# Each pair below handles one remainder k of the current offset modulo 0x10 and
# calls mz-next-overlay-aligned 0x10-k bytes further on (0 bytes when k is 0).
>>0 offset%0x10 0x0
# already aligned
>>>0x0 use mz-next-overlay-aligned
>>0 offset%0x10 0x1
>>>0xf use mz-next-overlay-aligned
>>0 offset%0x10 0x2
>>>0xe use mz-next-overlay-aligned
>>0 offset%0x10 0x3
>>>0xd use mz-next-overlay-aligned
>>0 offset%0x10 0x4
>>>0xc use mz-next-overlay-aligned
>>0 offset%0x10 0x5
>>>0xb use mz-next-overlay-aligned
>>0 offset%0x10 0x6
>>>0xa use mz-next-overlay-aligned
>>0 offset%0x10 0x7
>>>0x9 use mz-next-overlay-aligned
>>0 offset%0x10 0x8
>>>0x8 use mz-next-overlay-aligned
>>0 offset%0x10 0x9
>>>0x7 use mz-next-overlay-aligned
>>0 offset%0x10 0xa
>>>0x6 use mz-next-overlay-aligned
>>0 offset%0x10 0xb
>>>0x5 use mz-next-overlay-aligned
>>0 offset%0x10 0xc
>>>0x4 use mz-next-overlay-aligned
>>0 offset%0x10 0xd
>>>0x3 use mz-next-overlay-aligned
>>0 offset%0x10 0xe
>>>0x2 use mz-next-overlay-aligned
>>0 offset%0x10 0xf
>>>0x1 use mz-next-overlay-aligned
# This named instance is called by mz-next-overlay with the overlay offset rounded
# up to a multiple of 0x10. It recognizes the MP signature there; everything else
# is reported through mz-unrecognized.
0 name mz-next-overlay-aligned
>0 string MP \b, EXP (MP) for MS-DOS, Phar Lap 386 DOS extender
# no MP signature at the aligned offset
>0 default x
>>0 use mz-unrecognized
# This named instance is called for unrecognized MZ DOS binary from any offset
# It does not test any file content: the "default x" line always prints the generic
# description, and the MIME type and extension list below are attached to it.
0 name mz-unrecognized
>0 default x \b, MZ for MS-DOS
!:mime application/x-dosexec
# Windows and later versions of DOS will allow .EXEs to be named with a .COM
# extension, mostly for compatibility's sake.
# like: EDIT.COM 4DOS.COM CMD8086.COM CMD-FR.COM SYSLINUX.COM
# URL: https://en.wikipedia.org/wiki/Personal_NetWare#VLM
# Reference: https://mark0.net/download/triddefs_xml.7z/defs/e/exe-vlm-msg.trid.xml
# also like: BGISRV.DRV
!:ext exe/com/vlm/drv
# This named instance is called for BW collection with offset from the beginning of the file
# It looks for an embedded DOS/16M or DOS/4G extender and, failing that, for the
# error message of the DOS/4G stub.
0 name mz-bw-collection
# (8.s*16): 16-bit value at offset 8 multiplied by 16
# NOTE(review): presumably the MZ header size given in 16-byte paragraphs - confirm against the MZ header layout
>(8.s*16) default x
# continue at the position given by the 16-bit value found 0x30 bytes further on
>>&(&0x30.s) default x
>>>&0 string DOS/16M \b, DOS/16M DOS extender (embedded)
>>>&-8 string DOS/16M \b, DOS/16M DOS extender (embedded)
>>>&-8 string DOS/4G \b, DOS/4G DOS extender (embedded)
# no embedded extender name found, so search for the stub error message instead
>>>0 default x
>>>>(8.s*16) search/0x4000 Stub\ failed\ to\ find\ DOS/4G\ extender. \b, DOS/4G DOS extender (stub)
# This named instance is called for CauseWay MZ 3P binary with offset from the beginning of the file
# Both tests are plain text searches in fixed windows of 0x100 bytes.
0 name mz-3p
# CWC.EXE and WL32.EXE from cw349bin.zip
>0x440 search/0x100 CauseWay\ DOS\ Extender \b, CauseWay DOS extender
# CWHELP.EXE from cw349bin.zip
>0x200 search/0x100 CauseWay\ dynamic\ link\ library \b, CauseWay DLL
# Summary: OS/2 LX Library and device driver (no DOS stub)
# From: Joerg Jenderek
# URL: http://en.wikipedia.org/wiki/EXE
# Reference: http://www.textfiles.com/programming/FORMATS/lxexe.txt
# https://github.com/open-watcom/open-watcom-v2/blob/master/bld/watcom/h/exeflat.h
# https://github.com/bitwiseworks/os2tk45/blob/master/h/exe386.h
# https://archive.org/download/IBMOS2Warp4ToolkitDocuments2/lxref.htm
# Note: by dll-os2-no-dos-stub.trid.xml called "OS/2 Dynamic Link Library (no DOS stub)"
# looks similar to the variant with MS-DOS stub (MZ magic): "MS-DOS executable, LX"
0 string/b LX LX executable
#!:mime application/x-msdownload
!:mime application/x-lx-executable
# The 16-bit value at offset 2 selects how lx-executable is called:
# 0x0000 as is, 0x0101 with swapped endianness (the "\^" prefix)
>2 uleshort =0x0000
>>0 use lx-executable
# no examples found for big endian variant
>2 uleshort =0x0101
>>0 use \^lx-executable
# no examples found for PDP-11 endian variant
>2 uleshort =0x0100
# PDP-11-endian is not supported by magic "use" keyword yet
# no examples found for other endian variants
# NOTE(review): this "default" is nested below the 0x0100 test, whereas the same
# sequence inside the MZ/LX branch keeps it at the level of the endianness tests;
# neither prints anything, so the output is not affected
>>0 default x
# other endianness is not supported by magic "use" keyword
# This named instance describes an LX header; all offsets are relative to the LX signature.
# It is called from the standalone LX entry and from the LX branch of the MZ entry.
# It prints, in this order: target OS, module type and CPU type.
0 name lx-executable
# FOR DEBUGGING!
# byte order: 00h~little-endian 01h~big-endian
#>0x02 ubyte =0 \b, little-endian byte order
#>0x02 ubyte =1 \b, big-endian byte order
# word order: 00h~little-endian 01h~big-endian
#>0x03 ubyte =0 \b, little-endian word order
#>0x03 ubyte =1 \b, big-endian word order
# cpu_type; CPU type like: 1~i286 2~i386 3~i486 4~i586 20h~i860-N10 21h~i860-N11 40h~MIPS R2000,R3000 41h~MIPS R6000 42h~MIPS R4000
#>0x08 uleshort x \b, CPU %u
# os_type; target operating system like: 0~unknown 1~OS/2 2~Windows 16-bit 3~Multitasking MS-DOS 4.x 4~Windows 386 5~IBM Microkernel PN
#>0x0A leshort x \b, OS %u
# flags; module type flags
#>0x10 ulelong x \b, FLAGS %#8.8x
# 00000002h ~Reserved for system use
#>0x10 ulelong &0x00000002 \b, 2h reserved
# OSF_INIT_INSTANCE=00000004h ~Per-Process Library Initialization; setting this bit for EXE file is invalid
#>0x10 ulelong &0x00000004 \b, per-process library Initialization
#>0x10 ulelong &0x00000008 \b, system dll
# OSF_INTERNAL_FIXUPS_DONE=00000010h ~Internal fixups for the module have been applied
#>0x10 ulelong &0x00000010 \b, int. fixup
# OSF_EXTERNAL_FIXUPS_DONE=00000020h ~External fixups for the module have been applied
#>0x10 ulelong &0x00000020 \b, ext. fixup
# OSF_NOT_PM_COMPATIBLE=00000100h ~Incompatible with PM windowing
#>0x10 ulelong&0x00000700 =0x00000100 \b, incompatible with PM windowing
# OSF_PM_COMPATIBLE=00000200h ~Compatible with PM windowing
#>0x10 ulelong&0x00000700 =0x00000200 \b, compatible with PM windowing
#>0x10 ulelong&0x00000700 =0x00000300 \b, uses PM windowing API
#>0x10 ulelong &0x00002000 \b, not loadable
#>0x10 ulelong &0x00008000 \b, library module
# bit 17; device driver
#>0x10 ulelong &0x00020000 \b, device driver
#>0x10 ulelong &0x00080000 \b, multiple-processor unsafe
# Per-process Library Termination; setting this bit for EXE file is invalid
#>0x10 ulelong &0x40000000 \b, per-process library termination
# OS type
# "clear" resets the match state of this level so that the "default" below only
# triggers when none of the OS type tests after this line matched
>0x0a clear x
>0x0a leshort 1 for OS/2
# OS 2 was reserved for MS Windows 16-bit but it never used LX (NE format was used instead)
#>0x0a leshort 2 for MS Windows 16-bit
# OS 3 was reserved for Multitasking MS-DOS but it never used LX (NE format was used instead)
#>0x0a leshort 3 for Multitasking MS-DOS
# OS 4 was reserved for MS Windows device drivers but it never used LX (LE format was used instead)
#>0x0a leshort 4 for MS Windows
# OS 5 was reserved for IBM Microkernel Personality Neutral but it never used LX (the only released IBM Workplace OS for PowerPC used ELF format)
#>0x0a leshort 5 for IBM Microkernel Personality Neutral
# any other OS type value is printed in hexadecimal
>0x0a default x
>>0x0a leshort x for unknown OS %#x
# http://www.ctyme.com/intr/rb-2939.htm#Table1610
# library by module type mask 00038000h (bits 15-17);
# 0h ~executable Program module
>0x10 ulelong&0x00038000 =0x00000000 (EXE)
!:ext exe
# bits 8-10; OSF_PM_APP=700h in flags ~Uses PM windowing API; either it is GUI or console
>>0x10 ulelong&0x00000700 =0x00000100 (full screen)
>>0x10 ulelong&0x00000700 =0x00000200 (console)
>>0x10 ulelong&0x00000700 =0x00000300 (GUI)
# the remaining seven values of the 3-bit module type field
>0x10 ulelong&0x00038000 =0x00008000 (DLL)
!:ext dll
>0x10 ulelong&0x00038000 =0x00010000 (unknown)
>0x10 ulelong&0x00038000 =0x00018000 (PMDLL)
>0x10 ulelong&0x00038000 =0x00020000 (PDD)
!:ext sys
>0x10 ulelong&0x00038000 =0x00028000 (VDD)
!:ext sys
>0x10 ulelong&0x00038000 =0x00030000 (DLD)
>0x10 ulelong&0x00038000 =0x00038000 (unknown)
# CPU type
# same clear/default pattern as for the OS type above
>0x08 clear x
>0x08 uleshort 1 \b, Intel i286
# all inspected examples
>0x08 uleshort 2 \b, Intel i386
>0x08 uleshort 3 \b, Intel i486
>0x08 uleshort 4 \b, Intel i586
# 20h Intel i860 N10 or compatible
# 21h Intel i860 N11 or compatible
# 40h MIPS Mark I ( R2000, R3000) or compatible
# 41h MIPS Mark II ( R6000 ) or compatible
# 42h MIPS Mark III ( R4000 ) or compatible
# values without a test of their own (including the i860 and MIPS codes listed above) are printed in hexadecimal
>0x08 default x
>>0x08 uleshort x \b, unknown CPU %#x
# Endianness for debugging, there are no samples for non-little-endian
#>0x02 clear x
#>0x02 uleshort =0x0000 (little-endian)
#>0x02 uleshort =0x0101 (big-endian)
#>0x02 uleshort =0x0100 (PDP-11-endian)
#>0x02 default x (unknown-endian)
# added by Joerg Jenderek of https://www.freedos.org/software/?prog=kc
# and https://www.freedos.org/software/?prog=kpdos
# for FreeDOS files like KEYBOARD.SYS, KEYBRD2.SYS, KEYBRD3.SYS, *.KBD
0 string/b KCF FreeDOS KEYBoard Layout collection
# only version=0x100 found
>3 uleshort x \b, version %#x
# length of string containing author, info and special characters
>6 ubyte >0
#>>6 pstring x \b, name=%s
# author: text starting at offset 7, at most 14 characters are printed
>>7 string >\0 \b, author=%-.14s
# info: text following the first 0xff byte found within 254 bytes, at most 15 characters are printed
>>7 search/254 \xff \b, info=
#>>>&0 string x \b%-s
>>>&0 string x \b%-.15s
# for FreeDOS *.KL files
0 string/b KLF FreeDOS KEYBoard Layout file
# only version=0x100 or 0x101 found
>3 uleshort x \b, version %#x
# string length; the name is only printed when it is not zero
>5 ubyte >0
# at most the first 2 characters of the text at offset 8 are printed
>>8 string x \b, name=%-.2s
# MS-DOS keyboard layout file: 12-byte signature (0xff, "KEYB", 3 spaces, 4 nil bytes)
# followed at offset 12 by a fixed 7-byte sequence
0 string \xffKEYB\ \ \ \0\0\0\0
>12 string \0\0\0\0`\004\360 MS-DOS KEYBoard Layout file
# DOS device driver updated by Joerg Jenderek at May 2011,Mar 2017,Aug 2020,Mar 2023
# URL: http://fileformats.archiveteam.org/wiki/DOS_device_driver
# Reference: http://www.delorie.com/djgpp/doc/rbinter/it/46/16.html
# http://www.o3one.org/hwdocs/bios_doc/dosref22.html
# The first 8 bytes are read as one little-endian quad: the low 32 bits (pointer field)
# must be 0xffffffff and the bits selected by 0x07a0 in the following 16-bit
# attribute word must be zero; the upper 16 bits of the quad are ignored.
0 ulequad&0x07a0ffffffff 0xffffffff
# skip OS/2 INI ./os2
>4 ubelong !0x14000000
#>>10 ubequad x MAYBE_DRIVER_NAME=%16.16llx
# https://bugs.astron.com/view.php?id=434
# skip OOXML document fragment 0000.dat where driver name is "empty" instead of "ASCII like"
>>10 ubequad !0
>>>0 use msdos-driver
# This named instance describes a DOS device driver header located at offset 0.
# It assembles one parenthesized phrase from the attribute word at offset 4 and the
# name field at offset 10, then lists the supported features.
# NOTE(review): according to the "1 space char after/before" comments below, several
# messages end or begin with a space that glues the phrase together; keep leading and
# trailing whitespace of the message fields intact when editing.
0 name msdos-driver DOS executable (
#!:mime application/octet-stream
!:mime application/x-dosdriver
# also found FreeDOS print driver SPOOL.DEV and disc compression driver STACLOAD.BIN
# and IBM Token-Ring adapter IBMTOK.DOS. Why and when DOS instead SYS is used?
# PROTMAN.DOS ELNKPL.DOS
!:ext sys/dev/bin/dos
# 1 space char after "UPX compressed" to get phrase like "UPX compressed character device"
>40 search/7 UPX! \bUPX compressed
# DOS device driver attributes
# bit 15 of the attribute word: clear for a block device, set for a character device
>4 uleshort&0x8000 0x0000 \bblock device driver
# character device
>4 uleshort&0x8000 0x8000 \b
# 1 space char after "clock" to get phrase like "clock character device driver CLOCK$"
>>4 uleshort&0x0008 0x0008 \bclock
# fast video output by int 29h
# 1 space char after "fast" to get phrase like "fast standard input/output character device driver"
>>4 uleshort&0x0010 0x0010 \bfast
# standard input/output device
# 1 space char after "standard" to get phrase like "standard input/output character device driver"
>>4 uleshort&0x0003 >0 \bstandard
# bit 0 prints "input", bit 1 prints "output"; the slash is only printed when both are set
>>>4 uleshort&0x0001 0x0001 \binput
>>>4 uleshort&0x0003 0x0003 \b/
# 1 space char after "output" to get phrase like "input/output character device driver"
>>>4 uleshort&0x0002 0x0002 \boutput
>>4 uleshort&0x8000 0x8000 \bcharacter device driver
# always true; only serves as parent for the name field handling below
>0 ubyte x
# upx compressed device driver has garbage instead of real in name field of header
# the test without message matches UPX packed drivers, so the "default" branch is skipped for them
>>40 search/7 UPX!
>>40 default x
# leading/trailing nulls, zeros or non ASCII characters in 8-byte name field at offset 10 are skipped
# 1 space char before device driver name to get phrase like "device driver PROTMAN$" "device driver HP-150II" "device driver PC$MOUSE"
# the name characters at offsets 10 to 17 are printed one by one, each guarded by its own range checks
>>>12 ubyte >0x23 \b
>>>>10 ubyte >0x20
>>>>>10 ubyte !0x2E
>>>>>>10 ubyte !0x2A \b%c
>>>>11 ubyte >0x20
>>>>>11 ubyte !0x2E \b%c
>>>>12 ubyte >0x20
>>>>>12 ubyte !0x39
>>>>>>12 ubyte !0x2E \b%c
>>>13 ubyte >0x20
>>>>13 ubyte !0x2E \b%c
>>>>14 ubyte >0x20
>>>>>14 ubyte !0x2E \b%c
>>>>15 ubyte >0x20
>>>>>15 ubyte !0x2E \b%c
>>>>16 ubyte >0x20
>>>>>16 ubyte !0x2E
>>>>>>16 ubyte <0xCB \b%c
>>>>17 ubyte >0x20
>>>>>17 ubyte !0x2E
>>>>>>17 ubyte <0x90 \b%c
# some character device drivers like ASPICD.SYS, btcdrom.sys and Cr_atapi.sys contain only spaces or points in name field
>>>12 ubyte <0x2F
# they have their real name at offset 22
# also block device drivers like DUMBDRV.SYS
>>>>22 string >\056 %-.6s
# feature list: each set attribute bit appends one ",feature-" fragment
>4 uleshort&0x8000 0x0000
# 32 bit sector addressing ( > 32 MB) for block devices
>>4 uleshort&0x0002 0x0002 \b,32-bit sector-
# support by driver functions 13h, 17h, 18h
>4 uleshort&0x0040 0x0040 \b,IOCTL-
# open, close, removable media support by driver functions 0Dh, 0Eh, 0Fh
>4 uleshort&0x0800 0x0800 \b,close media-
# output until busy support by int 10h for character device driver
>4 uleshort&0x8000 0x8000
>>4 uleshort&0x2000 0x2000 \b,until busy-
# direct read/write support by driver functions 03h,0Ch
>4 uleshort&0x4000 0x4000 \b,control strings-
# the word "support" closes the feature list when at least one fragment was printed:
# mask 0x6840 covers the bits tested above for character devices, 0x4842 those for block devices
>4 uleshort&0x8000 0x8000
>>4 uleshort&0x6840 >0 \bsupport
>4 uleshort&0x8000 0x0000
>>4 uleshort&0x4842 >0 \bsupport
# closing parenthesis of the phrase opened in the description of this named instance
>0 ubyte x \b)
# the pointer field is only shown when it differs from 0xffffffff
>0 ulelong !0xffffffff with pointer %#x
# The entries below match drivers which the generic DOS device driver test misses.
# Each one compares the first 8 bytes as a whole (little-endian quad) and then
# calls msdos-driver for the description.
# DOS driver cmd640x.sys has 0x12 instead of 0xffffffff for pointer field to next device header
0 ulequad 0x0513c00000000012
>0 use msdos-driver
# DOS drivers DC2975.SYS, DUMBDRV.SYS, ECHO.SYS also have a value other than 0xffffffff in the pointer field
0 ulequad 0x32f28000ffff0016
>0 use msdos-driver
0 ulequad 0x007f00000000ffff
>0 use msdos-driver
# https://www.uwe-sieber.de/files/cfg_echo.zip
0 ulequad 0x001600000000ffff
>0 use msdos-driver
# DOS drivers LS120.SYS, MKELS120.SYS use reserved bits of attribute field
0 ulequad 0x0bf708c2ffffffff
>0 use msdos-driver
0 ulequad 0x07bd08c2ffffffff
>0 use msdos-driver
# 3Com EtherLink 3C501 CID\SERVER\IBMLS\IBM500D1\DLSNETDR.ZIP\ELNK.DOS
0 ulequad 0x027ac0c0ffffffff
>0 use msdos-driver
# IBM Streamer CID\SERVER\IBMLS\IBM500D1\DLSNETDR.ZIP\IBMMPC.DOS
0 ulequad 0x00228880ffffffff
>0 use msdos-driver
# updated by Joerg Jenderek
# GRR: line below too general as it catches also
# rt.lib DYADISKS.PIC and many more
# start with assembler instruction MOV
# Three exclusions are chained below; only files passing all of them are described by msdos-com.
0 ubyte 0x8c
# skip "AppleWorks word processor data" like ARTICLE.1 ./apple
>4 string !O====
# skip some unknown basic binaries like RocketRnger.SHR
>>5 string !MAIN
# skip "GPG symmetrically encrypted data" ./gnu
# skip "PGP symmetric key encrypted data" ./pgp
# openpgpdefs.h: fourth byte < 14 indicate cipher algorithm type
>>>4 ubyte >13
>>>>0 use msdos-com
# the remaining files should be DOS *.COM executables
# (file name followed by a hex dump of its first bytes)
# dosshell.COM 8cc0 2ea35f07 e85211 e88a11 b80058 cd
# hmload.COM 8cc8 8ec0 bbc02b 89dc 83c30f c1eb04 b4
# UNDELETE.COM 8cca 2e8916 6503 b430 cd21 8b 2e0200 8b
# BOOTFIX.COM 8cca 2e8916 9603 b430 cd21 8b 2e0200 8b
# RAWRITE3.COM 8cca 2e8916 d602 b430 cd21 8b 2e0200 8b
# SHARE.COM 8cca 2e8916 d602 b430 cd21 8b 2e0200 8b
# validchr.COM 8cca 2e8916 9603 b430 cd21 8b 2e028b1e
# devload.COM 8cca 8916ad01 b430 cd21 8b2e0200 892e
# This named instance describes a file already assumed to be a DOS COM style executable.
# It prints the kind inside parentheses (Lotus driver, COM, COM or COMBOOT, SCREATE.SYS),
# then packer/archive hints and finally the first 8 bytes as start instructions.
0 name msdos-com
# URL: http://fileformats.archiveteam.org/wiki/DOS_executable_(.com)
>0 byte x DOS executable (
# DOS executable with JuMP 16-bit instruction
>0 byte =0xE9
# check for probably nil padding til offset 64 of Lotus driver name
>>56 quad =0
# check for "long" alphabetic Lotus driver name like:
# Diablo "COMPAQ Text Display" "IBM Monochrome Display" "Plantronics ColorPlus"
>>>24 regex =^[A-Z][A-Za-z\040]{5,21} \bLotus driver) %s
!:mime application/x-dosexec
# like: CPQ0TD.DRV IBM0MONO.DRV (Lotus 123 10a) SDIAB4.DRV SPL0CPLS.DRV (Lotus Symphony 2)
!:ext drv
# COM with nils like MODE.COM IBMDOS.COM (pcdos 3.31 ru Compaq) RSSTUB.COM (PC-DOS 2000 de) ACCESS.COM (Lotus Symphony 1)
>>>24 default x \bCOM)
!:mime application/x-dosexec
!:ext com
# DOS executable with JuMP 16-bit and without nil padding
>>56 quad !0
# https://wiki.syslinux.org/wiki/index.php?title=Doc/comboot
# TODO: HOWTO distinguish COMboot from pure DOS executables?
# look for unreliable Syslinux specific api call INTerrupt 22h for 16-bit COMBOOT program
>>>1 search/0xc088 \xcd\x22 \bCOM or COMBOOT 16-bit)
!:mime application/x-dosexec
# like: sbm.cbt command.com (Windows XP) UNI2ASCI.COM (FreeDOS 1.2)
!:ext com/cbt
>>>1 default x \bCOM)
!:mime application/x-dosexec
!:ext com
# DOS executable without JuMP 16-bit instruction
>0 byte !0xE9
# SCREATE.SYS https://en.wikipedia.org/wiki/Stac_Electronics
>>10 string =?STACVOL \bSCREATE.SYS)
!:mime application/x-dosexec
!:ext sys
# COM executable without JuMP 16-bit instruction and not SCREATE.SYS
>>10 string !?STACVOL \bCOM)
!:mime application/x-dosexec
!:ext com
# additional hints, tested for every kind reported above
>6 string SFX\ of\ LHarc \b, %s
>0x1FE leshort 0xAA55 \b, boot code
>85 string UPX \b, UPX compressed
>4 string \ $ARX \b, ARX self-extracting archive
>4 string \ $LHarc \b, LHarc self-extracting archive
>0x20e string SFX\ by\ LARC \b, LARC self-extracting archive
# like: E30ODI.COM MADGEODI.COM UNI2ASCI.COM RECOVER.COM (DOS 2) COMMAND.COM (DOS 2)
>1 search/0xc088 \xcd\x22 \b, maybe with interrupt 22h
# first 4 bytes shown as big-endian hexadecimal number
>0 ubelong x \b, start instruction %#8.8x
# show more instructions but not in samples like: rem.com (DJGPP)
>4 ubelong x %8.8x
# JMP 8bit
# Files starting with opcode 0xeb are split into three cases by the byte at offset 16,
# which is interpreted as number of FATs: more than 3, zero, or anything else.
# Each case skips known disk images before handing over to msdos-com.
0 byte 0xeb
# byte 0xeb conflicts with magic leshort 0xn2eb of "SYMMETRY i386" handled by ./sequent
# allow forward jumps only
>1 byte >-1
# that offset must be accessible
# with hexadecimal values like: 0e 2e 50 8c 8d ba bc bd be e8 fb fc
# (1.b+2): value of the byte at offset 1 plus 2
>>(1.b+2) byte x
# if look like COM executable with x86 boot signature then this
# implies FAT volume with x86 real mode code already handled by ./filesystems
#
# No x86 boot signature implies often DOS executable
# check for unrealistic high number of FATs. Then it is an unusual disk image or often a DOS executable
# like: FIXBIOS.COM (50 bytes)
>>>16 ubyte >3
# https://www.drivedroid.io/
# skip MBR disk image drivedroid.img version 12 July 2013 by start message
>>>>2 string !DriveDroid
# ftp://old-dos.ru/OSCollect/OS/MS-DOS/Final Releases/
# skip unusual floppy image disk1.img of MS-DOS 1.25 (Corona Data Systems OEM)
# by check for characteristic message text near the beginning
>>>>>15 string !Non\040System\040disk
# "ftp://old-dos.ru/OSCollect/OS/BeOS/BeOS 4.0.rar"
# skip BeOS 4 bootfloppy.img done as "Linux kernel x86 boot executable" by ./linux
# by check for characteristic message text near the beginning
>>>>>>6 string !read\040error\015
# https://github.com/ventoy/Ventoy/releases/download/v1.0.78/ventoy-1.0.78-windows.zip
# skip ventoy 1.0.78 boot_hybrid.img
>>>>>>>24 string !\220\220\353I$\022\017
# "ftp://old-dos.ru/OSCollect/OS/MS-DOS/Final Releases/PC-DOS 1.0 (5.25).rar"
# skip unusual floppy image PCDOS100.IMG of DOS 1.0
# by check for characteristic message text near the beginning
>>>>>>>>9 string !7-May-81
# "ftp://old-dos.ru/OSCollect/OS/BeOS/BeOS 5.0 Personal (BA).rar"
# skip BeOS 5 floppy_1.44.00.ima done as "DOS/MBR boot sector" by ./filesystems
# by check for characteristic message near the beginning
>>>>>>>>>3 string !\370sdfS\270
# like: FIXBIOS.COM (50 bytes)
>>>>>>>>>>0 use msdos-com
# check for unrealistic low number of FATs. Then it is an unusual FAT disk image or often a DOS executable
# like: DEVICE.COM INSTALL.COM (GAG 4.10) WORD.COM (Word 1.15)
>>>16 ubyte =0
# if low FATs with x86 boot signature it can be unusual disk image like: boot.img (Ventoy 1.0.27) geodspms.img (Syslinux)
# the test without message consumes files with boot signature, so "default" only handles files without it
>>>>0x1FE leshort =0xAA55
>>>>0x1FE default x
# https://thestarman.pcministry.com/tool/hxd/dimtut.htm
# skip unusual floppy image TK-DOS11.img IBMDOS11.img of IBM DOS 1.10
# by check for characteristic bootloader names near end of boot sector
>>>>>395 string !ibmbio\040\040com
>>>>>>0 use msdos-com
# 8-bit jump with valid number of FAT implies FAT volume already handled by ./filesystems
# like: balder.img
>>>16 default x
# skip disk images with boot signature at end of 1st sector
# like: TDSK-64b.img
# (11.s-2): two bytes before the offset given by the 16-bit value at offset 11
# NOTE(review): presumably that value is the sector size of the volume - confirm against the FAT boot sector layout
>>>>(11.s-2) uleshort !0xAA55
# skip unusual floppy image without boot signature like 360k-256.img (mtools 4.0.18)
# by check for characteristic file system type text for FAT (12 bit or 16 bit)
>>>>>54 string !FAT
# "ftp://old-dos.ru/OSCollect/OS/MS-DOS/Final Releases/Microsoft MS-DOS 3.31 (Compaq OEM) (3.5).rar"
# skip unusual floppy image Disk4.img without boot signature and file system type text
# by check for characteristic OEM-ID text
>>>>>>3 string !COMPAQ\040\040
# no such DOS COM executables found
>>>>>>>0 use msdos-com
# JMP 16bit
# Files whose first byte is E9h are handed to the named entry msdos-com
# (defined outside this section) unless the bytes tested below look like
# the header of a FAT disk image or an ESP-IDF application image.
0 byte 0xe9
# display DOS executable (COM or COMBOOT 16-bit strength=40=40-0) after ESP-IDF application image (strength=40=40+0) handled by ./firmware
#!:strength -0
# 16-bit offset; for DEBUGGING!; can be negative like: USBDRIVE.COM
# 2h (CPQ0TD.DRV) 4FEh (NDN.COM) 581h (DRMOUSE.COM) 1FDh (GAG.COM) BE07h (USBDRIVE.COM)
#>1 uleshort x \b, OFFSET=%#4.4x
#>1 leshort x \b, OFFSET %d
# forward jumps
>1 leshort >-1
# that offset must be accessible
# with hexadecimal values like: 06 1e 0e 2e 60 8c 8d b4 ba be e8 fc
# (1.s+3): 16-bit little-endian value stored at offset 1, plus 3 bytes
# for the jump instruction itself (1 opcode byte + 2 offset bytes)
>>(1.s+3) byte x
# check for unrealistic high number of FATs. Then it is not a disk image and it is a DOS executable
# like: CALLVER.COM CPUCACHE.COM K437_EUR.COM SHSUCDX.COM UMBFILL.COM (183 bytes)
>>>16 ubyte >3
>>>>0 use msdos-com
# check for unrealistic low number of FATs. Then it is not a disk image and it is a DOS executable
# like: GAG.COM DRMOUSE.COM NDN.COM CPQ0TD.DRV
# or ESP-IDF application image like: WLED_0.14.0_ESP32-C3.bin opendtu-generic_esp32.bin
>>>16 ubyte =0
# skip ESP-IDF application image handled by ./firmware with ESP_APP_DESC_MAGIC_WORD
>>>>32 ulelong !0xABCD5432
>>>>>0 use msdos-com
# maybe disc image with valid number of FATs or DOS executable
# like: IPXODI.COM PERUSE.COM TASKID.COM
# (reached only when neither of the two tests on offset 16 above matched,
# i.e. the value is 1, 2 or 3)
>>>16 default x
# invalid low media descriptor. Then it is not a disk image and it is a DOS executable
>>>>21 ubyte <0xE5
>>>>>0 use msdos-com
# valid media descriptor. Then it is maybe disk image or DOS executable
>>>>21 ubyte >0xE4
# invalid sectorsize not a power of 2 from 32-32768. Then it is not a disk image and it must be DOS executable
# like: LEARN.COM (Word 1.15)
# (the mask keeps the low 5 bits; any of them set means the value is not a multiple of 32)
>>>>>11 uleshort&0x001f !0
>>>>>>0 use msdos-com
# negative offset, must not lead into PSP
# like: BASICA.COM (PC dos 3.20) FORMAT.COM SMC8100.COM WORD.COM (word4)
# HIDSUPT1.COM USBDRIVE.COM USBSUPT1.COM USBUHCI.COM (FreeDOS USBDOS)
>1 leshort <-259
# that offset must be accessible
# add 10000h to jump at end of 64 KiB segment, add 1 for jump instruction and 2 for 16-bit offset
# (1,s...): the comma (instead of a dot) requests a signed read of the
# 16-bit value at offset 1, see magic(5)
>>(1,s+65539) byte x
# after jump next instruction for DEBUGGING!
#>>>&-1 ubelong x \b, NEXT instruction %#8.8x
>>>0 use msdos-com
# updated by Joerg Jenderek at Oct 2008,2015,2022
# Files whose first byte is B8h: either a Syslinux COM32/COM32R module
# (recognized by the 32-bit value that follows) or, after several
# exclusions, a DOS COM executable described by the named entry msdos-com
# (defined outside this section).
# following line is too general
0 ubyte 0xb8
# skip 2 linux kernels like memtest.bin with "\xb8\xc0\x07\x8e" in ./linux
>0 string !\xb8\xc0\x07\x8e
# modified by Joerg Jenderek
# syslinux COM32 or COM32R executable
# (the mask clears the lowest bit so that both 0x21CD4CFf and 0x21CD4CFe match)
>>1 lelong&0xFFFFFFFe 0x21CD4CFe COM executable (32-bit COMBOOT
# https://www.syslinux.org/wiki/index.php/Comboot_API
# Since version 5.00 c32 modules switched from the COM32 object format to ELF
!:mime application/x-c32-comboot-syslinux-exec
!:ext c32
# https://syslinux.zytor.com/comboot.php
# older syslinux version ( <4 )
# (32-bit COMBOOT) programs *.C32 contain 32-bit code and run in flat-memory 32-bit protected mode
# start with assembler instructions mov eax,21cd4cffh
>>>1 lelong 0x21CD4CFf \b)
# syslinux:doc/comboot.txt
# A COM32R program must start with the byte sequence B8 FE 4C CD 21 (mov
# eax,21cd4cfeh) as a magic number.
# syslinux version (4.x)
# "COM executable (COM32R)" or "Syslinux COM32 module" by TrID
>>>1 lelong 0x21CD4CFe \b, relocatable)
# everything else starting with B8h that is not a COM32 module
>>1 default x
# look for interrupt instruction like in rem.com (DJGPP) LOADER.COM (DR-DOS 7.x)
>>>3 search/118 \xCD
# FOR DEBUGGING; possible hexadecimal interrupt number like: 10~BANNER.COM 13~bcdw_cl.com 15~poweroff.com (Syslinux)
# 1A~BERNDPCI.COM 20~SETENHKB.COM 21~mostly 22~gfxboot.com (Syslinux) 2F~SHUTDOWN.COM (GEMSYS)
#>>>>&0 ubyte x \b, INTERRUPT %#x
# few examples with interrupt 0x13 instruction
# (&0 is the byte directly after the CDh found by the search, i.e. the interrupt number)
>>>>&0 ubyte =0x13
# FOR DEBUGGING!
#>>>>>3 ubequad x \b, 2nd INSTRUCTION %#16.16llx
# skip Gpt.com Mbr.com (edk2-UDK2018 bootsector) described as "DOS/MBR boot sector" by ./filesystems
# by check for assembler instructions: mov es,ax ; mov ax,07c0h ; mov ds,ax
>>>>>3 ubequad !0x8ec0b8c0078ed88d
# few COM executables with interrupt 0x13 instruction like: Bootable CD Wizard executables bcdw_cl.com fdemuoff.com
# http://bootcd.narod.ru/bcdw150z_en.zip
>>>>>>0 use msdos-com
# few examples with interrupt 0x16 instruction like flashimg.img
>>>>&0 ubyte =0x16
# skip Syslinux 3.71 flashimg.img done as "DOS/MBR boot sector" by ./filesystems
# by check for assembler instructions: cmp ax 0xE4E4 (magic); jnz
>>>>>8 ubelong !0x3DE4E475
# no DOS executable with interrupt 0x16 found
>>>>>>0 use msdos-com
# most examples with interrupt instruction unequal 0x13 and 0x16
>>>>&0 default x
#>>>>>&-1 ubyte x \b, INTERRUPT %#x
# like: LOADER.COM SETENHKB.COM banner.com copybs.com gif2raw.com poweroff.com rem.com
>>>>>0 use msdos-com
# few COM executables without interrupt instruction like RESTART.COM (DOS 7.10) REBOOT.COM
# or some EUC-KR text files or one Ulead Imaginfo thumbnail
# (reached only when the search for CDh above found nothing)
>>>3 default x
# FOR DEBUGGING; 2nd instruction like 0x50 (RESTART.COM) 0x8e (REBOOT.COM)
# or random like: 0x0 (IMAGINFO.PE3 sky_snow) 0xb1 (euckr_.txt)
#>>>>3 ubyte x \b, 2nd INSTRUCTION %#x
# skip 1 Ulead Imaginfo thumbnail (IMAGINFO.PE3 sky_snow)
# inside SAMPLES/TEXTURES/SKY_SNOW
# from https://archive.org/download/PI3CANON/PI3CANON.iso
>>>>3 ubyte !0x0
# skip some EUC-KR text files like: euckr_falsepositive.txt
# https://bugs.astron.com/view.php?id=186
>>>>>3 ubyte !0xb1
# like: RESTART.COM (DOS 7.10) REBOOT.COM
>>>>>>0 use msdos-com
# UPX compressed DOS COM executables (and UPX compressed code page fonts)
# URL: https://en.wikipedia.org/wiki/UPX
# Reference: https://github.com/upx/upx/archive/v3.96.zip/upx-3.96/
# src/stub/src/i086-dos16.com.S
# Update: Joerg Jenderek
# assembler instructions: cmp sp, offset sp_limit
0 string/b \x81\xfc
#>2 uleshort x \b, sp_limit=%#x
# assembler instructions: jump above +2; int 0x20; mov cx, offset bytes_to_copy
# NOTE(review): this test prints nothing and sits at the same continuation
# level as the search below, so it does not gate the UPX! check - confirm
# whether that is intended.
>4 string \x77\x02\xcd\x20\xb9
#>9 uleshort x \b, [bytes_to_copy]=%#x
# at different offsets assembler instructions: push di; jump decomp_start_n2b
>0x1e search/3 \x57\xe9
#>>&0 uleshort x \b, decomp_start_n2b=%#x
# src/stub/src/include/header.S; UPX_MAGIC_LE32
# (&2 skips the 16-bit jump target that follows the two bytes found by the search)
>>&2 string UPX! FREE-DOS executable (COM), UPX
!:mime application/x-dosexec
# UPX compressed *.CPI; See ./fonts
# the two complementary tests below choose the file name extension
>>>&21 string =FONT compressed DOS code page font
!:ext cpx
>>>&21 string !FONT compressed
!:ext com
# compressed size?
#>>>&14 uleshort+152 x \b, %u bytes
# uncompressed len
>>>&12 uleshort x \b, uncompressed %u bytes
# COM executable recognized by a message text stored at fixed offset 252
252 string Must\ have\ DOS\ version DR-DOS executable (COM)
!:mime application/x-dosexec
!:ext com
# COM executables recognized by the byte pair CD 21 at one of several
# fixed offsets; the names in the comments are sample files.
# GRR search is not working
#2 search/28 \xcd\x21 COM executable for MS-DOS
#WHICHFAT.cOM
2 string \xcd\x21 COM executable for DOS
!:mime application/x-dosexec
!:ext com
#DELTREE.cOM DELTREE2.cOM
4 string \xcd\x21 COM executable for DOS
!:mime application/x-dosexec
!:ext com
#IFMEMDSK.cOM ASSIGN.cOM COMP.cOM
5 string \xcd\x21 COM executable for DOS
!:mime application/x-dosexec
!:ext com
#DELTMP.COm HASFAT32.cOM
7 string \xcd\x21
# files starting with B8h are excluded here; they have their own entry
# (0 ubyte 0xb8) in this file
>0 byte !0xb8 COM executable for DOS
!:mime application/x-dosexec
!:ext com
#COMP.cOM MORE.COm
10 string \xcd\x21
# do not report again what the entry for offset 5 already matched
>5 string !\xcd\x21 COM executable for DOS
!:mime application/x-dosexec
!:ext com
#comecho.com
13 string \xcd\x21 COM executable for DOS
!:mime application/x-dosexec
!:ext com
#HELP.COm EDIT.coM
18 string \xcd\x21
# not printable before it?
# NOTE(review): "byte" is signed, and "default" only fires when no sibling
# test matched; as written the description seems to be printed only when
# byte 17 is >32 but not <126 - confirm that this matches the intent.
>17 byte >32
>>17 byte <126
>>17 default x COM executable for MS-DOS
!:mime application/x-dosexec
!:ext com
#NWRPLTRM.COm
23 string \xcd\x21 COM executable for MS-DOS
!:mime application/x-dosexec
!:ext com
#LOADFIX.cOm LOADFIX.cOm
30 string \xcd\x21 COM executable for MS-DOS
!:mime application/x-dosexec
!:ext com
#syslinux.com 3.11
70 string \xcd\x21 COM executable for DOS
!:mime application/x-dosexec
!:ext com
# many compressed/converted COMs start with a copy loop instead of a jump
# The two search patterns differ only in their fourth byte (\xa5 vs \xa4);
# each is looked for within 0xa bytes starting at offset 6.
0x6 search/0xa \xfc\x57\xf3\xa5\xc3 COM executable for MS-DOS
!:mime application/x-dosexec
!:ext com
0x6 search/0xa \xfc\x57\xf3\xa4\xc3 COM executable for DOS
!:mime application/x-dosexec
!:ext com
# continuation of the \xa4 variant only
>0x18 search/0x10 \x50\xa4\xff\xd5\x73 \b, aPack compressed
# COM executable recognized by a text fragment at fixed offset 0x3c
0x3c string W\ Collis\0\0 COM executable for MS-DOS, Compack compressed
!:mime application/x-dosexec
!:ext com
# FIXME: missing diet .com compression
# miscellaneous formats
# two-character signature "LZ" at the start of the file
0 string/b LZ MS-DOS executable (built-in)
# disabled single byte test
#0 byte 0xf0 MS-DOS program library data
#
# AAF files:
# <stuartc@rd.bbc.co.uk> Stuart Cunningham
# Both signatures start with the same 8 bytes \320\317\021\340\241\261\032\341
# and differ in the bytes that follow; the byte at offset 30 selects the
# sector size text (9 -> 512B, 12 -> 4kB).
0 string/b \320\317\021\340\241\261\032\341AAFB\015\000OM\006\016\053\064\001\001\001\377 AAF legacy file using MS Structured Storage
>30 byte 9 (512B sectors)
>30 byte 12 (4kB sectors)
0 string/b \320\317\021\340\241\261\032\341\001\002\001\015\000\002\000\000\006\016\053\064\003\002\001\001 AAF file using MS Structured Storage
>30 byte 9 (512B sectors)
>30 byte 12 (4kB sectors)
# Popular applications
#
# Microsoft Word for DOS and Microsoft Write documents; both share the
# 4-byte signature tested below.
# Update: Joerg Jenderek
# URL: http://fileformats.archiveteam.org/wiki/DOC
# Reference: https://web.archive.org/web/20170206041048/
# http://www.msxnet.org/word2rtf/formats/ffh-dosword5
# wIdent+dty
0 belong 0x31be0000
# skip droid skeleton like x-fmt-274-signature-id-488.doc
>128 ubyte >0 Microsoft
# the 16-bit value at offset 96 (page count, see below) tells the variants
# apart: 0 is reported as Word, non-zero as Write
>>96 uleshort =0 Word
!:mime application/msword
!:apple MSWDWDBN
# DCX is used in the Unix version.
!:ext doc/dcx
>>>0x6E ulequad =0 1.0-4.0
>>>0x6E ulequad !0 5.0-6.0
# always matches; only appends the common suffix
>>>0x6E ulequad x (DOS) Document
# https://web.archive.org/web/20130831064118/http://msxnet.org/word2rtf/formats/write.txt
>>96 uleshort !0 Write 3.0 (Windows) Document
!:mime application/x-mswrite
!:apple MSWDWDBN
# sometimes also doc like in splitter.doc srchtest.doc
!:ext wri/doc
# wTool must be 0125400 octal
#>>4 uleshort !0xAB00 \b, wTool %o
# reserved; must be zero
#>>6 ulelong !0 \b, reserved %u
# block pointer to the block containing optional file manager information
#>>0x1C uleshort x \b, at %#x info block
# jump to File manager information block
# (block number stored at offset 0x1C, multiplied by 128)
>>(0x1C.s*128) uleshort x
# test for valid information start; maybe also 0012h
>>>&-2 uleshort =0x0014
# the strings below follow one another; each &1 skips one byte after the
# end of the previously printed string
# Document ASCIIZ name
>>>>&0x12 string x %s
# author name
>>>>>&1 string x \b, author %s
# reviser name
>>>>>>&1 string x \b, reviser %s
# keywords
>>>>>>>&1 string x \b, keywords %s
# comment
>>>>>>>>&1 string x \b, comment %s
# version number
>>>>>>>>>&1 string x \b, version %s
# date of last change MM/DD/YY
>>>>>>>>>>&1 string x \b, %-.8s
# creation date MM/DD/YY
>>>>>>>>>>&9 string x created %-.8s
# file name of print format like NORMAL.STY
>>0x1E string >0 \b, formatted by %-.66s
# count of pages in whole file for write variant; maybe some times wrong
>>96 uleshort >0 \b, %u pages
# name of the printer driver like HPLASMS
>>0x62 string >0 \b, %-.8s printer
# number of blocks used in the file; seems to be 0 for Word 4.0 and Write 3.0
>>0x6A uleshort >0 \b, %u blocks
# bit field for corrected text areas
#>>0x6C uleshort x \b, %#x bit field
# text of document; some times start with 4 non printable characters like CR LF
# The cascade below skips up to five leading bytes below 0x20 (offsets
# 128-132) and prints the text starting at the first byte above 0x1F;
# nothing is printed when offsets 128-133 are all below 0x20.
>>128 ubyte x \b,
>>>128 ubyte >0x1F
>>>>128 string x %s
>>>128 ubyte <0x20
>>>>129 ubyte >0x1F
>>>>>129 string x %s
>>>>129 ubyte <0x20
>>>>>130 ubyte >0x1F
>>>>>>130 string x %s
>>>>>130 ubyte <0x20
>>>>>>131 ubyte >0x1F
>>>>>>>131 string x %s
>>>>>>131 ubyte <0x20
>>>>>>>132 ubyte >0x1F
>>>>>>>>132 string x %s
>>>>>>>132 ubyte <0x20
>>>>>>>>133 ubyte >0x1F
>>>>>>>>>133 string x %s
#
# Word document recognized by a 5-character text signature at offset 0
0 string/b PO^Q` Microsoft Word 6.0 Document
!:mime application/msword
#
# Word for Macintosh: the 32-bit value at offset 4 must be 0, then the
# big-endian 32-bit value at offset 0 selects the version text
4 long 0
>0 belong 0xfe320000 Microsoft Word for Macintosh 1.0
!:mime application/msword
!:ext mcw
>0 belong 0xfe340000 Microsoft Word for Macintosh 3.0
!:mime application/msword
!:ext mcw
>0 belong 0xfe37001c Microsoft Word for Macintosh 4.0
!:mime application/msword
!:ext mcw
>0 belong 0xfe370023 Microsoft Word for Macintosh 5.0
!:mime application/msword
!:ext mcw
# NOTE(review): the first four bytes of this pattern (\333\245-\0) are the
# same bytes as \xDB\xA5\x2D\x00 of the "WinWord 2.0" entry below, so a file
# matching this entry also matches that one - confirm whether both are needed.
0 string/b \333\245-\0\0\0 Microsoft Word 2.0 Document
!:mime application/msword
!:ext doc
# Note: seems already recognized as "OLE 2 Compound Document" in ./ole2compounddocs
#512 string/b \354\245\301 Microsoft Word Document
#!:mime application/msword
#
0 string/b \xDB\xA5\x2D\x00 Microsoft WinWord 2.0 Document
!:mime application/msword
#
# Excel worksheet recognized by a fixed 8-byte signature at offset 0
0 string/b \x09\x04\x06\x00\x00\x00\x10\x00 Microsoft Excel Worksheet
!:mime application/vnd.ms-excel
# https://www.macdisk.com/macsigen.php
!:apple XCELXLS4
!:ext xls
#
# Update: Joerg Jenderek
# URL: https://en.wikipedia.org/wiki/Lotus_1-2-3
# Reference: http://www.aboutvb.de/bas/formate/pdf/wk3.pdf
# Note: newer Lotus versions >2 use longer BOF record
# record type (BeginningOfFile=0000h) + length (001Ah)
0 belong 0x00001a00
# reserved should be 0h but 8c0dh for TUTMAC.WK3, 5h for SAMPADNS.WK3, 1h for a_readme.wk3, 1eh for K&G86.WK3
#>18 uleshort&0x73E0 0
# Lotus Multi Byte Character Set (LMBCS=1-31)
# the two nested tests accept values 1-31 only
>20 ubyte >0
>>20 ubyte <32 Lotus 1-2-3
#!:mime application/x-123
!:mime application/vnd.lotus-1-2-3
!:apple ????L123
# the 16-bit value at offset 4 selects the description and extension
# (version 5.26) labeled the entry as "Lotus 1-2-3 wk3 document data"
>>>4 uleshort 0x1000 WorKsheet, version 3
!:ext wk3
# (version 5.26) labeled the entry as "Lotus 1-2-3 wk4 document data"
>>>4 uleshort 0x1002 WorKsheet, version 4
# also worksheet template 4 (.wt4)
!:ext wk4/wt4
# no example or documentation for wk5
#>>>4 uleshort 0x???? WorKsheet, version 5
#!:ext wk5
# only MacrotoScript.123 example
>>>4 uleshort 0x1003 WorKsheet, version 97
# also worksheet template Smartmaster (.12M)?
!:ext 123
# only Set_Y2K.123 example
>>>4 uleshort 0x1005 WorKsheet, version 9.8 Millennium
!:ext 123
# no example for this version
>>>4 uleshort 0x8001 FoRMatting data
!:ext frm
# (version 5.26) labeled the entry as "Lotus 1-2-3 fm3 or fmb document data"
# TrID labels the entry as "Formatting Data for Lotus 1-2-3 worksheet"
>>>4 uleshort 0x8007 ForMatting data, version 3
!:ext fm3
# fallback for every other value at offset 4
>>>4 default x unknown
# file revision sub code 0004h for worksheets
>>>>6 uleshort =0x0004 worksheet
!:ext wXX
>>>>6 uleshort !0x0004 formatting data
!:ext fXX
# main revision number
>>>>4 uleshort x \b, revision %#x
# worksheets (sub code 0004h): show the active cell range
>>>6 uleshort =0x0004 \b, cell range
# active cellcoord range (start row, page,column ; end row, page, column)
# start values normally 0~1st sheet A1
# the start coordinates are printed only when they are not all zero
>>>>8 ulelong !0
>>>>>10 ubyte >0 \b%d*
>>>>>8 uleshort x \b%d,
>>>>>11 ubyte x \b%d-
# end page mostly 0
>>>>14 ubyte >0 \b%d*
# end row, column normally not 0
>>>>12 uleshort x \b%d,
>>>>15 ubyte x \b%d
# Lotus Multi Byte Character Set (1~cp850,2~cp851,...,16~japan,...,31~??)
>>>>20 ubyte >1 \b, character set %#x
# flags
>>>>21 ubyte x \b, flags %#x
# formatting data (sub code other than 0004h): show the first font name
>>>6 uleshort !0x0004
# record type (FONTNAME=00AEh)
>>>>30 search/29 \0\xAE
# variable length m (2) + entries (1) + ?? (1) + LMBCS string (n)
>>>>>&4 string >\0 \b, 1st font "%s"
#
# Update: Joerg Jenderek
# URL: http://fileformats.archiveteam.org/wiki/Lotus_1-2-3
# Reference: http://www.schnarff.com/file-formats/lotus-1-2-3/WSFF2.TXT
# Note: Used by both old Lotus 1-2-3 and Lotus Symphony (DOS) until version 2.x
# record type (BeginningOfFile=0000h) + length (0002h)
0 belong 0x00000200
# GRR: line above is too general as it catches also MS Windows CURsor
# to display MS Windows cursor (strength=70) before Lotus 1-2-3 (strength=70-1)
!:strength -1
# skip Windows cursors with image height <256 and keep Lotus with low opcode 0001-0083h
>7 ubyte 0
# skip Windows cursors with image width 256 and keep Lotus with positive opcode
>>6 ubyte >0 Lotus
# !:mime application/x-123
!:mime application/vnd.lotus-1-2-3
!:apple ????L123
# the 16-bit value at offset 4 selects the description and extension
# revision number (0404h = 123 1A, 0405h = Lotus Symphony , 0406h = 123 2.x wk1 , 8006h = fmt , ...)
# undocumented; (version 5.26) labeled the configurations as "Lotus 1-2-3"
>>>4 uleshort 0x0007 1-2-3 CoNFiguration, version 2.x (PGRAPH.CNF)
!:ext cnf
>>>4 uleshort 0x0C05 1-2-3 CoNFiguration, version 2.4J
!:ext cnf
>>>4 uleshort 0x0801 1-2-3 CoNFiguration, version 1-2.1
!:ext cnf
>>>4 uleshort 0x0802 Symphony CoNFiguration
!:ext cnf
>>>4 uleshort 0x0804 1-2-3 CoNFiguration, version 2.2
!:ext cnf
>>>4 uleshort 0x080A 1-2-3 CoNFiguration, version 2.3-2.4
!:ext cnf
>>>4 uleshort 0x1402 1-2-3 CoNFiguration, version 3.x
!:ext cnf
>>>4 uleshort 0x1450 1-2-3 CoNFiguration, version 4.x
!:ext cnf
# (version 5.26) labeled the entry as "Lotus 123"
# TrID labels the entry as "Lotus 123 Worksheet (generic)"
>>>4 uleshort 0x0404 1-2-3 WorKSheet, version 1
# extension "wks" also for Microsoft Works document
!:ext wks
# (version 5.26) labeled the entry as "Lotus 123"
# TrID labels the entry as "Lotus 123 Worksheet (generic)"
>>>4 uleshort 0x0405 Symphony WoRksheet, version 1.0
!:ext wrk/wr1
# (version 5.26) labeled the entry as "Lotus 1-2-3 wk1 document data"
# TrID labels the entry as "Lotus 123 Worksheet (V2)"
>>>4 uleshort 0x0406 1-2-3/Symphony worksheet, version 2
# Symphony (.wr1)
!:ext wk1/wr1
# no example for this japan version
>>>4 uleshort 0x0600 1-2-3 WorKsheet, version 1.xJ
!:ext wj1
# no example or documentation for wk2
#>>>4 uleshort 0x???? 1-2-3 WorKsheet, version 2
#!:ext wk2
# undocumented japan version
>>>4 uleshort 0x0602 1-2-3 worksheet, version 2.4J
!:ext wj3
# (version 5.26) labeled the entry as "Lotus 1-2-3 fmt document data"
>>>4 uleshort 0x8006 1-2-3 ForMaTting data, version 2.x
# japan version 2.4J (fj3)
!:ext fmt/fj3
# no example for this version
>>>4 uleshort 0x8007 1-2-3 FoRMatting data, version 2.0
!:ext frm
# (version 5.26) labeled the entry as "Lotus 1-2-3"
# fallback for every other value at offset 4
>>>4 default x unknown worksheet or configuration
!:ext cnf
>>>>4 uleshort x \b, revision %#x
# lotus-cells prints nothing unless a RANGE record starts at the given offset
# 2nd record for most worksheets describes cells range
>>>6 use lotus-cells
# 3rd record for most japan worksheets describes cells range
# (offset = 16-bit value stored at offset 8, plus 10)
>>>(8.s+10) use lotus-cells
# check and then display Lotus worksheet cells range
# Named entry; offsets below are relative to the offset given at the
# "use lotus-cells" call site.
0 name lotus-cells
# look for type (RANGE=0006h) + length (0008h) at record begin
>0 ubelong 0x06000800 \b, cell range
# cell range (start column, row, end column, row) start values normally 0,0~A1 cell
# the start pair is printed only when it is not all zero
>>4 ulong !0
>>>4 uleshort x \b%d,
>>>6 uleshort x \b%d-
# end of cell range
>>8 uleshort x \b%d,
>>10 uleshort x \b%d
# EndOfLotus123
# Lotus WordPro: text "WordPro" followed either by a NUL byte or by \r\373
0 string/b WordPro\0 Lotus WordPro
!:mime application/vnd.lotus-wordpro
0 string/b WordPro\r\373 Lotus WordPro
!:mime application/vnd.lotus-wordpro
# Summary: Script used by InstallShield to uninstall applications
# Extension: .isu
# Submitted by: unknown
# Modified by (1): Abel Cheung <abelcheung@gmail.com> (replace useless entry)
# 6-byte signature at offset 0, confirmed by a vendor text at offset 12
0 string \x71\xa8\x00\x00\x01\x02
>12 string Stirling\ Technologies, InstallShield Uninstall Script
# Winamp .avs
# the disabled variant below additionally required the bytes
# \060\056\061\032 after the common text prefix
#0 string Nullsoft\ AVS\ Preset\ \060\056\061\032 A plug in for Winamp ms-windows Freeware media player
0 string/b Nullsoft\ AVS\ Preset\ Winamp plug in
# Windows Metafile .WMF
# URL: http://fileformats.archiveteam.org/wiki/Windows_Metafile
# http://en.wikipedia.org/wiki/Windows_Metafile
# Reference: https://winprotocoldoc.blob.core.windows.net/productionwindowsarchives/MS-WMF/%5bMS-WMF%5d.pdf
# http://mark0.net/download/triddefs_xml.7z/defs/w/wmf.trid.xml
# Note: called "Windows Metafile" by TrID and
# verified by ImageMagick `identify -verbose *.wmf` as WMF (Windows Meta File)
# META_PLACEABLE Record (Aldus Placeable Metafile signature)
0 string/b \327\315\306\232
# Note: called "Windows Metafile Image with Placeable File Header" by DROID via PUID x-fmt/119
# and verified by XnView `nconvert -info abydos.wmf SPA_FLAG.wmf hardcopy-windows-meta.wmf` as "Windows Placeable metafile"
# skip failed libreoffice-7.3.2.2 ofz35149-1.wmf with invalid version 2020h and exttextout-2.wmf with invalid version 3a02h
# and x-fmt-119-signature-id-609.wmf without version instead of 0100h=METAVERSION100 or 0300h=METAVERSION300
# (offset 26 = version field of the META_HEADER record that starts at
# offset 22; the mask 0xFDff lets both 0100h and 0300h compare equal to 0100h)
>26 uleshort&0xFDff =0x0100 Windows metafile
# HWmf; resource handle to the metafile; When the metafile is on disk, this field MUST contain 0
# seems to be always true but in failed samples 2020h ofz35149-1.wmf 56f8h exttextout-2.wmf
>>4 uleshort !0 \b, resource handle %#x
# BoundingBox; the rectangle in the playback context measured in logical units for displaying
# sometimes useful like: hardcopy-windows-meta.wmf (0,0 / 1280,1024)
# but garbage in x-fmt-119-signature-id-609.wmf (-21589,-21589 / -21589,-21589)
#>>6 ubequad x \b, bounding box %#16.16llx
# Left; x-coordinate of the upper-left corner of the rectangle
>>6 leshort x \b, bounding box (%d
# Top; y-coordinate upper-left corner
>>8 leshort x \b,%d
# Right; x-coordinate lower-right corner
>>10 leshort x / %d
# Bottom; y-coordinate lower-right corner
>>12 leshort x \b,%d)
# Inch; number of logical units per inch like: 72 96 575 576 1000 1200 1439 1440 2540
>>14 uleshort x \b, dpi %u
# Reserved; field is not used and MUST be set to 0; but ababababh in x-fmt-119-signature-id-609.wmf
>>16 ulelong !0 \b, reserved %#x
# Checksum; checksum for the previous 10 words
>>20 uleshort x \b, checksum %#x
# META_HEADER Record after META_PLACEABLE Record
>>22 use wmf-head
# GRR: no example for type 2 (DISKMETAFILE) variant found under few thousands WMF
# metafile without placeable header: type 0002h followed by header size 9
0 string/b \002\000\011\000 Windows metafile
>0 use wmf-head
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/w/wmf-16.trid.xml
# Note: called "Windows Metafile (old Win 3.x format)" by TrID and
# "Windows Metafile Image without Placeable File Header" by DROID via PUID x-fmt/119
# verified by XnView `nconvert -info *.wmf` as Windows metafile
# variant with type=1=MEMORYMETAFILE and valid HeaderSize 9
0 string/b \001\000\011\000
# skip DROID x-fmt-119-signature-id-1228.wmf by looking for content after header (18 bytes=2*011)
>18 ulelong >0 Windows metafile
# GRR: in version 5.44 unequal and not endian variant not working!
#>18 ulelong !0 THIS_SHOULD_NOT_HAPPEN
#>18 long !0 THIS_SHOULD_NOT_HAPPEN
# the header starts at offset 0 because there is no placeable record in front
>>0 use wmf-head
# display information of Windows metafile header (type, size, objects)
# Named entry; offsets below are relative to the offset given at the
# "use wmf-head" call site. Also sets the MIME type and extension.
0 name wmf-head
# MetafileType: 0001h=MEMORYMETAFILE~Metafile is stored in memory 0002h=DISKMETAFILE~Metafile is stored on disk
>0 uleshort !0x0001 \b, type %#x
# HeaderSize; the number of WORDs in header record; seems to be always 9 (18 bytes)
# (the value is doubled to bytes before comparing and printing)
>2 uleshort*2 !18 \b, header size %u
# MetafileVersion: 0100h=METAVERSION100~DIBs (device-independent bitmaps) not supported 0300h=METAVERSION300~DIBs are supported
# but in failed samples 2020h ofz35149-1.wmf 3a02h exttextout-2.wmf
>4 uleshort =0x0100 \b, DIBs not supported
# prints nothing; presumably kept so that the "default" below does not
# fire for version 0300h
>4 uleshort =0x0300
#>4 uleshort =0x0300 \b, DIBs supported
# this should not happen!
>4 default x \b, version
>>4 uleshort x %#x
# Size; the number of WORDs in the entire metafile
>6 ulelong x \b, size %u words
#>6 ulelong*2 x \b, size %u bytes
!:mime image/wmf
!:ext wmf
# NumberOfObjects: the number of graphics objects like: 0 hardcopy-windows-meta.wmf 1 2 3 4 5 6 7 8 9 12 13 14 16 17 20 27 110 PERSGRID.WMF
>10 uleshort x \b, %u objects
# MaxRecord: the size of the largest record in the metafile in WORDs like: 78h b0h 1f4h 310h 63fh 1e0022h 3fcc21h
>12 ulelong x \b, largest record size %#x
# NumberOfMembers: It SHOULD be 0x0000, but 5 TestBitBltStretchBlt.wmf 13 TestPalette.wmf and in failed samples 4254 bitcount-1.wmf 8224 ofz5942-1.wmf 56832 exttextout-2.wmf
>16 uleshort !0 \b, %u members
#tz3 files whatever that is (MS Works files)
# the three signatures differ only in their second byte (\001, \002, \003)
0 string/b \003\001\001\004\070\001\000\000 tz3 ms-works file
0 string/b \003\002\001\004\070\001\000\000 tz3 ms-works file
0 string/b \003\003\001\004\070\001\000\000 tz3 ms-works file
# PGP sig files .sig
# the first five signatures differ only in their 10th byte (octal 065 to 071)
#0 string \211\000\077\003\005\000\063\237\127 065 to \027\266\151\064\005\045\101\233\021\002 PGP sig
0 string \211\000\077\003\005\000\063\237\127\065\027\266\151\064\005\045\101\233\021\002 PGP sig
0 string \211\000\077\003\005\000\063\237\127\066\027\266\151\064\005\045\101\233\021\002 PGP sig
0 string \211\000\077\003\005\000\063\237\127\067\027\266\151\064\005\045\101\233\021\002 PGP sig
0 string \211\000\077\003\005\000\063\237\127\070\027\266\151\064\005\045\101\233\021\002 PGP sig
0 string \211\000\077\003\005\000\063\237\127\071\027\266\151\064\005\045\101\233\021\002 PGP sig
# separate, shorter signature
0 string \211\000\225\003\005\000\062\122\207\304\100\345\042 PGP sig
# windows zips files .dmf
# text "MDIF" followed by a fixed 20-byte binary sequence
0 string/b MDIF\032\000\010\000\000\000\372\046\100\175\001\000\001\036\001\000 MS Windows special zipped file
# Windows icons
# Update: Joerg Jenderek
# URL: https://en.wikipedia.org/wiki/CUR_(file_format)
# Note: similar to Windows CURsor. container for BMP (only DIB part) or PNG
0 belong 0x00000100
# byte 9 is the 4th byte of the first directory entry (entries start after
# the 6-byte directory header); only the values 0 and FFh are accepted
# before the shared named entry cur-ico-dir is called
>9 byte 0
>>0 byte x
>>0 use cur-ico-dir
>9 ubyte 0xff
>>0 byte x
>>0 use cur-ico-dir
# displays number of icons and information for icon or cursor
# Named entry shared by the icon (00000100h) and cursor (00000200h)
# signatures; it prints the "MS Windows" prefix, sets MIME type and
# extension, and describes the first directory entries.
0 name cur-ico-dir
# skip some Lotus 1-2-3 worksheets, CYCLE.PIC and keep Windows cursors with
# 1st data offset = dir header size + n * dir entry size = 6 + n * 10h = ?6h
>18 ulelong &0x00000006
# skip remaining worksheets, because valid only for DIB image (40) or PNG image (\x89PNG)
# (matches only when the offset stored at 18 can actually be read)
>>(18.l) ulelong x MS Windows
>>>0 ubelong 0x00000100 icon resource
# https://www.iana.org/assignments/media-types/image/vnd.microsoft.icon
!:mime image/vnd.microsoft.icon
#!:mime image/x-icon
!:ext ico
>>>>4 uleshort x - %d icon
# plural s
>>>>4 uleshort >1 \bs
# 1st icon
>>>>0x06 use ico-entry
# 2nd icon
>>>>4 uleshort >1
>>>>>0x16 use ico-entry
>>>0 ubelong 0x00000200 cursor resource
#!:mime image/x-cur
!:mime image/x-win-bitmap
!:ext cur
# NOTE(review): the cursor branch also prints the word "icon" for the
# entry count - confirm whether that wording is intended.
>>>>4 uleshort x - %d icon
>>>>4 uleshort >1 \bs
# 1st cursor
>>>>0x06 use cur-entry
#>>>>0x16 use cur-entry
# display information of one cursor entry
# Named entry; prints the shared fields via cur-ico-entry and then the two
# 16-bit values at relative offsets 4 and 6 as the hotspot coordinates.
0 name cur-entry
>0 use cur-ico-entry
>4 uleshort x \b, hotspot @%dx
>6 uleshort x \b%d
# display information of one icon entry
# Named entry; prints the shared fields via cur-ico-entry, then planes and
# bits per pixel, each only when the value is greater than 1.
0 name ico-entry
>0 use cur-ico-entry
# normally 0 1 but also found 14
>4 uleshort >1 \b, %d planes
# normally 0 1 but also found some 3, 4, some 6, 8, 24, many 32, two 256
>6 uleshort >1 \b, %d bits/pixel
# display shared information of cursor or icon entry
# Named entry; offsets are relative to the start of one directory entry.
0 name cur-ico-entry
# first two bytes are printed as the two dimensions; a stored 0 is shown as 256
>0 byte =0 \b, 256x
>0 byte !0 \b, %dx
>1 byte =0 \b256
>1 byte !0 \b%d
# number of colors in palette
>2 ubyte !0 \b, %d colors
# reserved 0 FFh
#>3 ubyte x \b, reserved %x
#>8 ulelong x \b, image size %d
# offset of PNG or DIB image
#>12 ulelong x \b, offset %#x
# PNG header (\x89PNG)
>(12.l) ubelong =0x89504e47
# 1 space char after "with" to get phrase "with PNG image" by magic in ./images
# (&-4 steps back to the start of the 4 signature bytes just compared)
>>&-4 indirect x \b with
# DIB image
# (currently prints nothing; the follow-up below is disabled)
>(12.l) ubelong !0x89504e47
#>>&-4 use dib-image
# Windows non-animated cursors
# Update: Joerg Jenderek
# URL: https://en.wikipedia.org/wiki/CUR_(file_format)
# Note: similar to Windows ICOn. container for BMP ( only DIB part)
# GRR: line below is too general as it catches also Lotus 1-2-3 files
0 belong 0x00000200
# byte 9 is the 4th byte of the first directory entry; only the values 0
# and FFh are accepted before the shared named entry cur-ico-dir is called
>9 byte 0
>>0 use cur-ico-dir
>9 ubyte 0xff
>>0 use cur-ico-dir
# .chr files
# the two signatures differ only in the case of the leading "PK"/"pk";
# the text starting at offset 4 ("BGI...") is appended to the description
0 string/b PK\010\010BGI Borland font
>4 string >\0 %s
# then there is a copyright notice
# .bgi files
0 string/b pk\010\010BGI Borland device
>4 string >\0 %s
# then there is a copyright notice
# Windows Recycle Bin record file (named INFO2)
# By Abel Cheung (abelcheung AT gmail dot com)
# Version 4 always has 280 bytes (0x118) per record, version 5 has 800 bytes
# Since Vista uses another structure, INFO2 structure probably won't change
# anymore. Detailed analysis in:
# http://www.cybersecurityinstitute.biz/downloads/INFO2.pdf
# version at offset 0, record size at offset 12 (0x118 = 280, 0x320 = 800)
0 lelong 0x00000004
>12 lelong 0x00000118 Windows Recycle Bin INFO2 file (Win98 or below)
0 lelong 0x00000005
>12 lelong 0x00000320 Windows Recycle Bin INFO2 file (Win2k - WinXP)
# From Doug Lee via a FreeBSD pr
# text signatures starting with "GERBIL" at offset 9 or offset 0
9 string GERBILDOC First Choice document
9 string GERBILDB First Choice database
# NOTE(review): GERBILCLIP is reported with the same text as GERBILDB -
# confirm whether "database" is the intended description.
9 string GERBILCLIP First Choice database
0 string GERBIL First Choice device file
9 string RABBITGRAPH RabbitGraph file
# short text or 32-bit signatures at offset 0
0 string DCU1 Borland Delphi .DCU file
# the leading "=" makes the "!" part of the string to match instead of a negation
0 string =!<spell> MKS Spell hash list (old format)
0 string =!<spell2> MKS Spell hash list
# Too simple - MPi
#0 string AH Halo(TM) bitmapped font file
0 lelong 0x08086b70 TurboC BGI file
0 lelong 0x08084b50 TurboC Font file
# Debian#712046: The magic below identifies "Delphi compiled form data".
# An additional source of information is available at:
# http://www.woodmann.com/fravia/dafix_t1.htm
0 string TPF0
# length prefixed (Pascal) string directly after the 4 byte signature
>4 pstring >\0 Delphi compiled form '%s'
# tests for DBase files moved, updated and merged to database
0 string PMCC Windows 3.x .GRP file
# the MegaDots signature starts at offset 1, not at offset 0
1 string RDC-meg MegaDots
# bytes 8 and 9 are printed as characters if above 0x2F, i.e. from "0" upwards
>8 byte >0x2F version %c
>9 byte >0x2F \b.%c file
# .PIF files added by Joerg Jenderek from https://smsoft.ru/en/pifdoc.htm
# only for windows versions equal or greater 3.0
0x171 string MICROSOFT\ PIFEX\0 Windows Program Information File
!:mime application/x-dosexec
!:ext pif
#>2 string >\0 \b, Title:%.30s
>0x24 string >\0 \b for %.63s
>0x65 string >\0 \b, directory=%.64s
>0xA5 string >\0 \b, parameters=%.64s
#>0x181 leshort x \b, offset %x
#>0x183 leshort x \b, offsetdata %x
#>0x185 leshort x \b, section length %x
# section "WINDOWS VMM 4.0": icon file, font and TrueType font names.
# Each name is tested with a "<" and a ">" comparison, so it is shown only if
# it differs from the name in the commented out equality test between them.
>0x187 search/0xB55 WINDOWS\ VMM\ 4.0\0
>>&0x5e ubyte >0
>>>&-1 string <PIFMGR.DLL \b, icon=%s
#>>>&-1 string PIFMGR.DLL \b, icon=%s
>>>&-1 string >PIFMGR.DLL \b, icon=%s
>>&0xF0 ubyte >0
>>>&-1 string <Terminal \b, font=%.32s
#>>>&-1 string =Terminal \b, font=%.32s
>>>&-1 string >Terminal \b, font=%.32s
>>&0x110 ubyte >0
>>>&-1 string <Lucida\ Console \b, TrueTypeFont=%.32s
#>>>&-1 string =Lucida\ Console \b, TrueTypeFont=%.32s
>>>&-1 string >Lucida\ Console \b, TrueTypeFont=%.32s
# further section names; each search starts again at offset 0x187
#>0x187 search/0xB55 WINDOWS\ 286\ 3.0\0 \b, Windows 3.X standard mode-style
#>0x187 search/0xB55 WINDOWS\ 386\ 3.0\0 \b, Windows 3.X enhanced mode-style
>0x187 search/0xB55 WINDOWS\ NT\ \ 3.1\0 \b, Windows NT-style
#>0x187 search/0xB55 WINDOWS\ NT\ \ 4.0\0 \b, Windows NT-style
>0x187 search/0xB55 CONFIG\ \ SYS\ 4.0\0 \b +CONFIG.SYS
#>>&06 string x \b:%s
>0x187 search/0xB55 AUTOEXECBAT\ 4.0\0 \b +AUTOEXEC.BAT
#>>&06 string x \b:%s
# Norton Guide (.NG , .HLP) files added by Joerg Jenderek from source NG2HTML.C
# of http://www.davep.org/norton-guides/ng2h-105.tgz
# https://en.wikipedia.org/wiki/Norton_Guides
0 string NG\0\001
# only value 0x100 found at offset 2
>2 ulelong 0x00000100 Norton Guide
!:mime application/x-norton-guide
# often like NORTON.NG but some times like NC.HLP
!:ext ng/hlp
# Title[40]
>>8 string >\0 "%-.40s"
#>>6 uleshort x \b, MenuCount=%u
# szCredits[5][66]
# only the first two credit lines (offset 48 and 48+66=114) are displayed
>>48 string >\0 \b, %-.66s
>>114 string >\0 %-.66s
# URL: https://en.wikipedia.org/wiki/Norton_Commander
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/m/msg-nc-eng.trid.xml
# From: Joerg Jenderek
# Note: Message file is used by executable with same main name.
# Only tested with version 5.50 (english) and 2.01 (Windows)
# the word "Abort" alone prints nothing; the description is attached to the
# search for a second message text below
0 string Abort
# \0 or i
#>5 ubyte x %x
# skip ASCII Abort text by looking for error message like in NCVIEW.MSG
>6 search/7089 Non-DOS\ disk Norton Commander module message
!:mime application/x-norton-msg
!:ext msg
# URL: http://www.antonis.de/dos/dos-tuts/mpdostip/html/nwdostip.htm
# Reference: https://mark0.net/download/triddefs_xml.7z/defs/m/msg-netware-dos.trid.xml
# From: Joerg Jenderek
0 string DOS\ Client\ Message\ File: Novell DOS client message
#!:mime application/octet-stream
#!:mime application/x-novell-msg
!:ext msg
# look for second letter instead space character
>26 ubyte >0x20
# digit 1 or often main or program name like: IPXODI.COM TASKID pnwtrap DOSRqstr
# The name is printed character by character from offset 25 to 36; every
# level depends on the one before, so the output ends at the first space.
>>25 ubyte !0x20 %c
>>>26 ubyte !0x20 \b%c
>>>>27 ubyte !0x20 \b%c
>>>>>28 ubyte !0x20 \b%c
>>>>>>29 ubyte !0x20 \b%c
>>>>>>>30 ubyte !0x20 \b%c
>>>>>>>>31 ubyte !0x20 \b%c
>>>>>>>>>32 ubyte !0x20 \b%c
>>>>>>>>>>33 ubyte !0x20 \b%c
>>>>>>>>>>>34 ubyte !0x20 \b%c
>>>>>>>>>>>>35 ubyte !0x20 \b%c
>>>>>>>>>>>>>36 ubyte !0x20 \b%c
# followed by string like: 0 v.10 V1.20
#
# followed by ,\040Tran
>28 search/14 ,\040Tran
# probably translated version string like: 0 v1.00
>>&0 string x \b, tran version %s
# followed by Ctrl-J Ctrl-Z
# only reported when the byte after the version string is not 0Ah
>>>&0 ubyte !0xa \b, terminated by %#2.2x
>>>>&0 ubyte x \b%2.2x
# the two fixed offsets below are reported only if they hold unexpected values
# Ctrl-Z
>0x65 ubyte !0x1A \b, at 0x65 %#x
# one
>0x66 ubyte !0x01 \b, at 0x66 %#x
# URL: https://en.wikipedia.org/wiki/NetWare
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/d/dat-novell-msg.trid.xml
# ftp://ftp.iitb.ac.in/LDP/en/NLM-HOWTO/NLM-HOWTO-single.html
# From: Joerg Jenderek
# identified by the leading text alone; the further text fragments below are
# kept as commented out tests only
0 string Novell\ Message\ Librarian\ Data\ File Novell message librarian data
#>35 string Version\ 1.00
#>49 string COPYRIGHT\ (c)\ 1985\ by\ Novell,\ Inc.
#>83 string \ \ All\ Rights\ Reserved
#!:mime application/octet-stream
#!:mime application/x-novell-msg
!:ext msg
#!:ext msg/dat
# Summary: Turbo Pascal Help
# From: Joerg Jenderek
# URL: https://en.wikipedia.org/wiki/Turbo_Pascal
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/h/hlp-tp-2.trid.xml
# Note: called "Turbo Pascal Help (v2)" by TrID
# identified by the 4 characters TPH2 at the very beginning
0 string TPH2 Turbo Pascal help, version 2
#!:mime application/octet-stream
!:mime application/x-pascal-hlp
# 4DOS help file, version 1.00 3.30
!:ext hlp
# URL: https://en.wikipedia.org/wiki/4DOS
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/h/hlp-4dos-v2.trid.xml
# Note: called "4DOS Help (v2)" by TrID
# starts with the two lines ALIAS and ASSIGN (CR LF terminated); the
# description is only printed if the text 4DOS is found afterwards
0 string ALIAS\r\nASSIGN\r\n
>13 search/3016 4DOS 4DOS help file, version 2.x
#!:mime text/plain
!:mime application/x-4dos-hlp
# DOS.HLP 4DOS help file, version 2.21
!:ext hlp
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/h/hlp-4dos-v4.trid.xml
# Note: called "4DOS Help (v4)" by TrID
# identified by the 4 characters 4DH4 at the very beginning
0 string 4DH4 4DOS help file, version 4.x
#!:mime application/octet-stream
!:mime application/x-4dos-hlp
# 4dos402b.hlp
!:ext hlp
# Reference: https://4dos.info/4dsource/4helpsrc.zip/TPHELP.PAS
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/h/hlp-4dos.trid.xml
# 4DOS help (.HLP) files added by Joerg Jenderek from source TPHELP.PAS
# of https://www.4dos.info/
# check for valid pascal string length (6 or 8) of HelpID, 4DH magic, valid major number (5 6 7 8)
# The mask keeps all bits of bytes 1-3 ("4DH"), only the high nibble of
# byte 4 (3xh, an ASCII digit) and of byte 0 all bits except 02h, 04h and 08h.
0 ubequad&0xF1ffFFffF0000000 0x0034444830000000 4DOS help file
#!:mime application/octet-stream
!:mime application/x-4dos-hlp
!:ext hlp
# pascal string length of HelpID like: 6 8
#>0 ubyte x PLENGHT=%x
# Note: version string correspond or is a little bit lower than value of _4VER variable or output of 4DOS command `VER /R`
# one-digit major version number of version string
>4 string x \b, version %-1.1s
# two-digit minor version number depending on pascal string length at the beginning
>>0 ubyte 8 \b.
>>>5 string x \b%-2.2s
# Byte at offset 7 (A=41h) and 8 (A=41h) is not Revision like C (=43h) as reported by VER /R for 4DOS602b.HLP
# GRR: maybe this is patch level
>>>7 string x %-.2s
# few samples with string length 6 (implying exact 2 byte minor version digits) like in 4DOS500f.HLP 4dos551c_ge.hlp
>>0 ubyte 6 \b.
>>>5 string x \b%-2.2s
# just in case pascal string length is neither 6 nor 8
#>>0 default x \b.
#>>>5 string x %-2.2s
# false for version 5.52 and older, but true for version 6.02 and newer
# (compares the two version digits at offset 4 and 5 with the characters "55")
>4 ubeshort >0x3535
# HighestTopic; highest topic number
#>>9 uleshort x HighestTopic=%#4.4x
# NumTopics; number of topics
#>>11 uleshort x NumTopics=%#4.4x
# BiggestTopic; size of largest topic in uncompressed bytes
#>>13 uleshort x BiggestTopic=%#4.4x
# NamedTopics; number of topics in help index
#>>15 uleshort x NamedTopics=%#4.4x
# NameSize; Size of largest name, 0 for none
#>>17 uleshort x NameSize=%#4.4x
# PickSize; size of each entry in pick table, 0 for none
#>>18 uleshort x PickSize=%#4.4x
# width; width of help window, with frame if any
#>>19 ubyte x Width=%#2.2x
# FirstTopic; topic to show first (0 = index)
#>>20 uleshort x FirstTopic=%#4.4x
# KeysTopic; topic to show when keys help needed
#>>22 uleshort x KeysTopic=%#4.4x
# ExtHelpName; string[13]; name for external help program like: HELP.COM DOSBOOK.EXE
>>24 pstring x \b, external help %s
# ExtHelpEnv; String[16]; environment variable for alternate external help program name like: DOSHELP
>>38 pstring x or specified by DOS environment variable %s
# XlateArray = array[0..29] of Byte; {Most common characters in help text}
#>>55 ubequad x XlateArray=%#16.16llx
# SharewareData : SharewareDataRec; shareware info for 4DOS.COM
#>>87 ubequad x SharewareData=%#16.16llx
# old binary Microsoft (.HLP) files added by Joerg Jenderek from http://file-extension.net/seeker/file_extension_hlp
# URL: http://fileformats.archiveteam.org/wiki/Microsoft_Advisor_Help
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/h/hlp-ms-adv.trid.xml
# Note: called "Microsoft Advisor Help" by TrID
# Read as little endian quad the file starts with the characters "LN"
# (4Ch 4Eh) followed by 02h 00h; the mask ignores the lowest bit of the
# byte at offset 4.
0 ulequad&0xFFffFFfeFFffFFff 0x003a000000024e4c MS Advisor help file
#!:mime application/octet-stream
!:mime application/x-ms-hlp
!:ext hlp
# HtmlHelp files (.chm)
# ITSF followed by the 4 byte values 3 and 60h (little endian byte sequences)
0 string/b ITSF\003\000\000\000\x60\000\000\000 MS Windows HtmlHelp Data
!:mime application/vnd.ms-htmlhelp
!:ext chm
# GFA-BASIC (Wolfram Kleff)
# the text starts at offset 2
2 string/b GFA-BASIC3 GFA-BASIC 3 data
#------------------------------------------------------------------------------
# From Stuart Caie <kyzer@4u.net> (developer of cabextract)
# Update: Joerg Jenderek
# URL: https://en.wikipedia.org/wiki/Cabinet_(file_format)
# Reference: https://msdn.microsoft.com/en-us/library/bb267310.aspx
# Note: verified by `7z l *.cab`
# Microsoft Cabinet files
# signature MSCF followed by 4 nul bytes
0 string/b MSCF\0\0\0\0 Microsoft Cabinet archive data
#
# The following level 1 searches all start at offset 2Ch and look for
# characteristic member names; the /c flag lets lower case pattern letters
# match both cases.
# https://support.microsoft.com/en-us/help/973559/frequently-asked-questions-about-the-microsoft-support-diagnostic-tool
# CAB with *.{diagcfg,diagpkg} is used by Microsoft Support Diagnostic Tool MSDT.EXE
# because some archive does not have *.diag* as 1st or 2nd archive member like
# O15CTRRemove.diagcab or AzureStorageAnalyticsLogs_global.DiagCab
# brute looking after header for filenames with diagcfg or diagpkg extension in CFFILE section
>0x2c search/980/c .diag \b, Diagnostic
!:mime application/vnd.ms-cab-compressed
!:ext diagcab
# http://fileformats.archiveteam.org/wiki/PUZ
# Microsoft Publisher version about 2003 has a "Pack and Go" feature that
# bundles a Publisher document *PNG.pub with all links into a CAB
>0x2c search/300/c png.pub\0 \b, Publisher Packed and Go
!:mime application/vnd.ms-cab-compressed
!:ext puz
# ppz variant with Microsoft PowerPoint Viewer ppview32.exe to play PowerPoint presentation
>0x2c search/17/c ppview32.exe\0 \b, PowerPoint Viewer Packed and Go
!:mime application/vnd.ms-powerpoint
#!:mime application/mspowerpoint
!:ext ppz
# URL: https://en.wikipedia.org/wiki/Windows_Desktop_Gadgets
# Reference: https://docs.microsoft.com/en-us/previous-versions/windows/desktop/sidebar/
# http://win10gadgets.com/download/273/ All_CPU_Meter1.zip/All_CPU_Meter_V4.7.3.gadget
>0x2c search/968/c gadget.xml \b, Windows Desktop Gadget
#!:mime application/vnd.ms-cab-compressed
# http://extension.nirsoft.net/gadget
!:mime application/x-windows-gadget
!:ext gadget
# http://www.incredimail.com/
# IncrediMail CAB contains an initialisation file "content.ini" like in im2.ims
>0x2c search/3369/c content.ini\0 \b, IncrediMail
!:mime application/x-incredimail
# member Flavor.htm implies IncrediMail ecard like in tell_a_friend.imf
>>0x2c search/83/c Flavor.htm\0 ecard
!:ext imf
# member Macromedia Flash data *.swf implies IncrediMail skin like in im2.ims
>>0x2c search/211/c .swf\0 skin
!:ext ims
# member anim.im3 implies IncrediMail animation like in letter_fold.ima
>>0x2c search/92/c anim.im3\0 animation
!:ext ima
# other IncrediMail cab archive
>>0x2c default x
>>>0x2c search/116/c thumb ecard, image, notifier or skin
!:ext imf/imi/imn/ims
# http://file-extension.net/seeker/file_extension_ime
>>>0x2c default x emoticons or sound
!:ext ime/imw
# no Diagnostic, Packed and Go, Windows Desktop Gadget, IncrediMail
>0x2c default x
# look for 1st member name
# (16 bytes after the offset that is stored as little endian long at offset 16)
>>(16.l+16) ubyte x
# From: Joerg Jenderek
# URL: https://docs.microsoft.com/en-us/windows-hardware/drivers/install/building-device-metadata-packages
# Reference: http://mark0.net/download/triddefs_xml.7z/defs/d/devicemetadata-ms.trid.xml
>>>&-1 string PackageInfo.xml \b, Device Metadata Package
!:mime application/vnd.ms-cab-compressed
!:ext devicemetadata-ms
# https://en.wikipedia.org/wiki/SNP_file_format
>>>&-1 string/c _accrpt_.snp \b, Access report snapshot
!:mime application/msaccess
!:ext snp
# https://en.wikipedia.org/wiki/Microsoft_InfoPath
>>>&-1 string manifest.xsf \b, InfoPath Form Template
!:mime application/vnd.ms-cab-compressed
#!:mime application/vnd.ms-infopath
!:ext xsn
# https://www.cabextract.org.uk/wince_cab_format/
# extension of DOS 8+3 name with ".000" of 1st archive member name implies Windows CE installer
>>>&7 string =.000 \b, WinCE install
!:mime application/vnd.ms-cab-compressed
!:ext cab
# https://support.microsoft.com/kb/934307/en-US
# All inspected MSU contain a file with name WSUSSCAN.cab
# that is called "Windows Update meta data" by Microsoft
>>>&-1 string/c wsusscan.cab \b, Microsoft Standalone Update
!:mime application/vnd.ms-cab-compressed
!:ext msu
>>>&-1 default x
# look at point character of 1st archive member name for file name extension
# GRR: search range is maybe too large and match point else where like in EN600x64.cab!
>>>>&-1 search/255 .
# http://www.pptfaq.com/FAQ00164_What_is_a_PPZ_file-.htm
# PPZ were created using Pack & Go feature of PowerPoint versions 97 - 2002
# packs optional files, a PowerPoint presentation *.ppt with optional PLAYLIST.LST to CAB
>>>>>&0 string/c ppt\0
>>>>>>28 uleshort >1 \b, PowerPoint Packed and Go
!:mime application/vnd.ms-powerpoint
#!:mime application/mspowerpoint
!:ext ppz
# or POWERPNT.PPT packed as POWERPNT.PP_ found on Windows 2000,XP setup CD in directory i386
>>>>>>28 uleshort =1 \b, one packed PowerPoint
!:mime application/vnd.ms-cab-compressed
!:ext pp_
# https://msdn.microsoft.com/en-us/library/windows/desktop/bb773190(v=vs.85).aspx
# first member *.theme implies Windows 7 Theme Pack like in CommunityShowcaseAqua3.themepack
# or Windows 8 Desktop Theme Pack like in PanoramicGlaciers.deskthemepack
>>>>>&0 string/c theme \b, Windows
!:mime application/x-windows-themepack
# https://www.drewkeller.com/content/using-theme-both-windows-7-and-windows-8
# 1st member Panoramic.theme or Panoramas.theme implies Windows 8-10 Theme Pack
# with MTSM=RJSPBS in [MasterThemeSelector] inside *.theme
>>>>>>(16.l+16) string =Panoram 8
!:ext deskthemepack
>>>>>>(16.l+16) string !Panoram 7 or 8
!:ext themepack/deskthemepack
>>>>>>(16.l+16) ubyte x Theme Pack
# URL: https://en.wikipedia.org/wiki/Microsoft_OneNote#File_format
# http://fileformats.archiveteam.org/wiki/OneNote
# Reference: https://mark0.net/download/triddefs_xml.7z/defs/o/onepkg.trid.xml
# 1st member name like: "Class Notes.one" "test-onenote.one" "Open Notebook.onetoc2" "Editor öffnen.onetoc2"
>>>>>&0 string/c one \b, OneNote Package
!:mime application/msonenote
!:ext onepkg
>>>>>&0 default x
# look for null terminator of 1st member name
>>>>>>&0 search/255 \0
# 2nd member name WSUSSCAN.cab like in Microsoft-Windows-MediaFeaturePack-OOB-Package.msu
>>>>>>>&16 string/c wsusscan.cab \b, Microsoft Standalone Update
!:mime application/vnd.ms-cab-compressed
!:ext msu
>>>>>>>&16 default x
# archive with more than one file need some output in version 5.32 to avoid error message like
# Magdir/msdos, 1138: Warning: Current entry does not yet have a description for adding a MIME type
# Magdir/msdos, 1139: Warning: Current entry does not yet have a description for adding a EXTENSION type
# file: could not find any valid magic files!
>>>>>>>>28 uleshort >1 \b, many
!:mime application/vnd.ms-cab-compressed
!:ext cab
# remaining archives with just one file
>>>>>>>>28 uleshort =1
# neither extra bytes nor cab chain implies Windows 2000,XP setup files in directory i386
>>>>>>>>>30 uleshort =0x0000 \b, Windows 2000/XP setup
# cut off last char of source extension and add underscore to generate extension
# TERMCAP._ ... FXSCOUNT.H_ ... L3CODECA.AC_ ... NPDRMV2.ZI_
!:mime application/vnd.ms-cab-compressed
!:ext _/?_/??_
# archive need some output like "single" in version 5.32 to avoid error messages
>>>>>>>>>30 uleshort !0x0000 \b, single
!:mime application/vnd.ms-cab-compressed
!:ext cab
# first archive name without point character
>>>>&-1 default x
>>>>>28 uleshort =1 \b, single
!:mime application/vnd.ms-cab-compressed
# on XP_CD\I386\ like: NETWORKS._ PROTOCOL._ QUOTES._ SERVICES._
!:ext _
>>>>>28 uleshort >1 \b, many
!:mime application/vnd.ms-cab-compressed
# like: HP Envy 6000 printer driver packages Full_x86.cab Full_x64.cab
!:ext cab
# TODO: additional extensions like
# .xtp InfoPath Template Part
# .lvf Logitech Video Effects Face Accessory
# total size and number of archive members
>8 ulelong x \b, %u bytes
>28 uleshort 1 \b, 1 file
>28 uleshort >1 \b, %u files
# Reserved fields, set to zero
#>4 belong !0 \b, reserved1 %x
#>12 belong !0 \b, reserved2 %x
# offset of the first CFFILE entry coffFiles: minimal 2Ch
>16 ulelong x \b, at %#x
>(16.l) use cab-file
# at least also 2nd member
>28 uleshort >1
>>(16.l+16) ubyte x
>>>&0 search/255 \0
# second member info
>>>>&0 use cab-file
#>20 belong !0 \b, reserved %x
# Cabinet file format version. Currently, versionMajor = 1 and versionMinor = 3
# (both bytes are read as one big endian value, so minor 3 + major 1 is 0x0301)
>24 ubeshort !0x0301 \b version %#x
# number of CFFOLDER entries
>26 uleshort >1 \b, %u cffolders
# cabinet file option indicators 1~PREVIOUS, 2~NEXT, 4~reserved fields
# only found for flags 0 1 2 3 4 not 7
>30 uleshort >0 \b, flags %#x
# Cabinet files have a 16-bit cabinet setID field that is designed for application use.
# default is zero, however, the -i option of cabarc can be used to set this field
>32 uleshort >0 \b, ID %u
# iCabinet is number of this cabinet file in a set, where 0 for the first cabinet
#>34 uleshort x \b, iCabinet %u
# add one for display because humans start numbering by 1 and also fit to name of disk szDisk*
>34 uleshort+1 x \b, number %u
>30 uleshort &0x0004 \b, extra bytes
# cbCFHeader optional size of per-cabinet reserved area 14h 1800h
>>36 uleshort >0 %u in head
# cbCFFolder is optional size of per-folder reserved area
>>38 ubyte >0 %u in folder
# cbCFData is optional size of per-datablock reserved area
>>39 ubyte >0 %u in data block
# optional per-cabinet reserved area abReserve[cbCFHeader]
>>36 uleshort >0
# 1st CFFOLDER after reserved area in header
>>>(36.s+40) use cab-folder
# no reserved area in header
>30 uleshort ^0x0004
# no previous and next cab archive
>>30 uleshort =0x0000
>>>36 use cab-folder
# only previous cab archive
>>30 uleshort =0x0001 \b, previous
>>>36 use cab-anchor
# only next cab archive
>>30 uleshort =0x0002 \b, next
>>>36 use cab-anchor
# previous+next cab archive
# can not use sub routine cab-anchor to display previous and next cabinet together
#>>>36 use cab-anchor
#>>>>&0 use cab-anchor
>>30 uleshort =0x0003 \b, previous
>>>36 string x %s
# optional name of previous disk szDisk*
>>>>&1 string x disk %s
>>>>>&1 string x \b, next %s
# optional name of next disk szDisk*
>>>>>>&1 string x disk %s
>>>>>>>&1 use cab-folder
# display filename and disk name of previous or next cabinet
# Named subroutine: prints two consecutive strings found at the position it
# is called with.
0 name cab-anchor
# optional name of previous/next cabinet file szCabinet*[255]
>&0 string x %s
# optional name of previous/next disk szDisk*[255]
# (the relative offset 1 presumably steps over the terminating nul of the
# cabinet name - confirm)
>>&1 string x disk %s
# display folder structure CFFOLDER information like compression of cabinet
# Named subroutine: the offsets below address the fields of one CFFOLDER entry.
0 name cab-folder
# offset of the CFDATA block in this folder
#>0 ulelong x \b, coffCabStart %#x
# number of CFDATA blocks in folder
>4 uleshort x \b, %u datablock
# plural s
>4 uleshort >1 \bs
# compression typeCompress: 0~None 1~MSZIP 0x1503~LZX:21 0x1003~LZX:16 0x0f03~LZX:15
# (printed as raw hexadecimal value, not translated to a name)
>6 uleshort x \b, %#x compression
# optional per-folder reserved area
#>8 ubequad x \b, abReserve %#llx
# display member structure CFFILE information like member name of cabinet
# Named subroutine: the offsets below address the fields of one CFFILE entry.
0 name cab-file
# cbFile is uncompressed size of file in bytes
#>0 ulelong x \b, cbFile %u
# uoffFolderStart is uncompressed offset of file in folder
#>4 ulelong >0 \b, uoffFolderStart %#x
# iFolder is index into the CFFOLDER area. 0 indicates first folder in cabinet
# define ifoldCONTINUED_FROM_PREV (0xFFFD)
# define ifoldCONTINUED_TO_NEXT (0xFFFE)
# define ifoldCONTINUED_PREV_AND_NEXT (0xFFFF)
# (only shown when not 0)
>8 uleshort >0 \b, iFolder %#x
# date stamp for file
>10 lemsdosdate x last modified %s
# time stamp for file
>12 lemsdostime x %s
# attribs is attribute flags for file
# define _A_RDONLY (0x01) file is read-only
# define _A_HIDDEN (0x02) file is hidden
# define _A_SYSTEM (0x04) file is a system file
# define _A_ARCH (0x20) file modified since last backup
# example http://sebastien.kirche.free.fr/pebuilder_plugins/depends.cab
# define _A_EXEC (0x40) run after extraction
# define _A_NAME_IS_UTF (0x80) szName[] contains UTF
# define UNKNOWN (0x0100) undocumented or accident
#>14 uleshort x \b, attribs %#x
# any attribute set: print "+" followed by one marker per set flag
>14 uleshort >0 +
>>14 uleshort &0x0001 \bR
>>14 uleshort &0x0002 \bH
>>14 uleshort &0x0004 \bS
>>14 uleshort &0x0020 \bA
>>14 uleshort &0x0040 \bX
>>14 uleshort &0x0080 \bUtf
# unknown 0x0100 flag found on one XP_CD:\I386\DRIVER.CAB
>>14 uleshort &0x0100 \b?
# szName is name of archive member
>16 string x "%s"
# next archive member name if more files
#>>&17 string >\0 \b, NEXT NAME %-.50s
# InstallShield Cabinet files
0 string/b ISc( InstallShield Cabinet archive data
# high nibble of byte 5: 6 is reported as version 6, anything else as 4/5
>5 byte&0xf0 =0x60 version 6,
>5 byte&0xf0 !0x60 version 4/5,
# file count is read 40 bytes after the offset stored as little endian long at offset 12
>(12.l+40) lelong x %u files
# Windows CE package files
0 string/b MSCE\0\0\0\0 Microsoft WinCE install header
# architecture value at offset 20; note that Hitachi SH3 is printed for 103
# and 10003 and Hitachi SH4 for 104 and 10005
>20 lelong 0 \b, architecture-independent
>20 lelong 103 \b, Hitachi SH3
>20 lelong 104 \b, Hitachi SH4
>20 lelong 0xA11 \b, StrongARM
>20 lelong 4000 \b, MIPS R4000
>20 lelong 10003 \b, Hitachi SH3
>20 lelong 10004 \b, Hitachi SH3E
>20 lelong 10005 \b, Hitachi SH4
>20 lelong 70001 \b, ARM 7TDMI
# number of files at offset 52 and of registry entries at offset 56;
# the value 1 gets its own line for the singular form
>52 leshort 1 \b, 1 file
>52 leshort >1 \b, %u files
>56 leshort 1 \b, 1 registry entry
>56 leshort >1 \b, %u registry entries
# Windows Enhanced Metafile (EMF)
# See msdn.microsoft.com/archive/en-us/dnargdi/html/msdn_enhmeta.asp
# for further information.
# the value 1 at offset 0 alone prints nothing; the description depends on
# the text " EMF" (with leading space) at offset 40
0 ulelong 1
>40 string \ EMF Windows Enhanced Metafile (EMF) image data
>>44 ulelong x version %#x
# octal escapes, i.e. the 3 bytes 94h A6h 2Eh
0 string/b \224\246\056 Microsoft Word Document
!:mime application/msword
# From: "Nelson A. de Oliveira" <naoliv@gmail.com>
# Magic type for Dell's BIOS .hdr files
# Dell's .hdr
0 string/b $RBU
>23 string Dell %s system BIOS
# byte 5 selects how the version is stored:
# value 2: three numeric bytes at offsets 48-50 printed as a.b.c
>5 byte 2
>>48 byte x version %d.
>>49 byte x \b%d.
>>50 byte x \b%d
# value below 2: up to 3 characters of text at offset 48
>5 byte <2
>>48 string x version %.3s
# Type: Microsoft Document Imaging Format (.mdi)
# URL: https://en.wikipedia.org/wiki/Microsoft_Document_Imaging_Format
# From: Daniele Sempione <scrows@oziosi.org>
# Too weak (EP)
#0 short 0x5045 Microsoft Document Imaging Format
# MS eBook format (.lit)
0 string/b ITOLITLS Microsoft Reader eBook Data
# little endian long directly after the 8 byte signature
>8 lelong x \b, version %u
!:mime application/x-ms-reader
# Windows CE Binary Image Data Format
# From: Dr. Jesus <j@hug.gs>
0 string/b B000FF\n Windows Embedded CE binary image
# The second byte of these signatures is a file version; I don't know what,
# if anything, produced files with version numbers 0-2.
# From: John Elliott <johne@seasip.demon.co.uk>
# second byte 3 is reported as v1.11 and 4 as v1.29+; third byte 1 instead
# of 0 is reported as protected program
0 string \xfc\x03\x00 Mallard BASIC program data (v1.11)
0 string \xfc\x04\x00 Mallard BASIC program data (v1.29+)
0 string \xfc\x03\x01 Mallard BASIC protected program data (v1.11)
0 string \xfc\x04\x01 Mallard BASIC protected program data (v1.29+)
0 string MIOPEN Mallard BASIC Jetsam data
0 string Jetsam0 Mallard BASIC Jetsam index data
# DOS backup 2.0 to 3.2
# URL: http://fileformats.archiveteam.org/wiki/BACKUP_(MS-DOS)
# Reference: http://www.ibiblio.org/pub/micro/pc-stuff/freedos/files/dos/restore/brtecdoc.htm
# backupid.@@@
# plausibility check for date
# The year is a 16 bit value written by DOS and therefore little endian.
# It is read with an explicit byte order (like the sequence number of the
# backed up files) so that the check does not depend on the byte order of
# the machine running file(1).
0x3 uleshort >1979
# day 1-31
>0x5 ubyte-1 <31
# month 1-12
>>0x6 ubyte-1 <12
# actually 121 nul bytes
>>>0x7 string \0\0\0\0\0\0\0\0
>>>>0x1 ubyte x DOS 2.0 backup id file, sequence %d
#!:mime application/octet-stream
!:ext @@@
>>>>0x0 ubyte 0xff \b, last disk
# backed up file
# skip some AppleWorks word like Tomahawk.Awp, WIN98SE-DE.vhd
# by looking for trailing nul of maximal file name string
0x52 ubyte 0
# test for flag byte: FFh~complete file, 00h~split file
# FFh -127 = -1 -127 = -128
# 00h -127 = 0 -127 = -127
>0 byte-127 <-126
# plausibility check for file name length
>>0x53 ubyte-1 <78
# looking for terminating nul of file name string
>>>(0x53.b+4) ubyte 0
# looking if last char of string is valid DOS file name
>>>>(0x53.b+3) ubyte >0x1F
# actually 44 nul bytes
# but sometimes garbage according to Ralf Quint. So can not be used as test
#>0x54 string \0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0
# first char of full file name is DOS (5Ch) or UNIX (2Fh) path separator
# only DOS variant found. UNIX variant according to V32SLASH.TXT in archive PD0315.EXE
# (both 5Ch and 2Fh give 0Ch after masking with 8Ch)
>>>>>5 ubyte&0x8C 0x0C
# ./msdos (version 5.30) labeled the entry as
# "DOS 2.0 backed up file %s, split file, sequence %d" or
# "DOS 2.0 backed up file %s, complete file"
>>>>>>0 ubyte x DOS 2.0-3.2 backed up
#>>>>>>0 ubyte 0xff complete
# flag byte 0 (split file): additionally show the sequence number
>>>>>>0 ubyte 0
>>>>>>>1 uleshort x sequence %d of
# full file name with path but without drive letter and colon stored from 0x05 til 0x52
>>>>>>0x5 string x file %s
#!:mime application/octet-stream
# backup name is original filename
#!:ext doc/exe/rar/zip
#!:ext *
# magic/Magdir/msdos, 1169: Warning: EXTENSION type ` *' has bad char '*'
# file: line 1169: Bad magic entry ' *'
# after header original file content
>>>>>>128 indirect x \b;
# DOS backup 3.3 to 5.x
# CONTROL.nnn files
# byte 8Bh followed by the text BACKUP and a space
0 string \x8bBACKUP\x20
# actually 128 nul bytes
>0xa string \0\0\0\0\0\0\0\0
# sequence number in the byte between signature and nul bytes
>>0x9 ubyte x DOS 3.3 backup control file, sequence %d
>>0x8a ubyte 0xff \b, last disk
# NB: The BACKUP.nnn files consist of the files backed up,
# concatenated.
# From: Joerg Jenderek
# URL: http://fileformats.archiveteam.org/wiki/MS-DOS_date/time
# Reference: https://docs.microsoft.com/en-us/windows/win32/api/winbase/nf-winbase-dosdatetimetofiletime
# Note: DOS date+time format is different from formats such as Unix epoch
# bit encoded; uses year values relative to 1980 and 2 second precision
# Named subroutine: expects the time word at offset 0 and the date word at
# offset 2. Only the date is printed, as day, month name and "1980+" offset.
0 name dos-date
# HHHHHMMMMMMSSSSS bit encoded Hour (0-23) Minute (0-59) SecondPart (*2)
#>0 uleshort x RAW TIME [%#4.4x]
# hour part
#>0 uleshort/2048 x hour [%u]
# YYYYYYYMMMMDDDDD bit encoded YearPart (+1980) Month (1-12) Day (1-31)
#>2 uleshort x RAW DATE [%#4.4x]
# day part
>2 uleshort&0x001F x %u
#>2 uleshort/16 x MONTH PART [%#x]
# GRR: not working
#>2 uleshort/16 &0x000F MONTH [%u]
#>2 uleshort&0x01E0 x MONTH PART [%#4.4x]
# month part: bits 5-8, so month n is compared as n*0x20
>2 uleshort&0x01E0 =0x0020 jan
>2 uleshort&0x01E0 =0x0040 feb
>2 uleshort&0x01E0 =0x0060 mar
>2 uleshort&0x01E0 =0x0080 apr
>2 uleshort&0x01E0 =0x00A0 may
>2 uleshort&0x01E0 =0x00C0 jun
>2 uleshort&0x01E0 =0x00E0 jul
>2 uleshort&0x01E0 =0x0100 aug
>2 uleshort&0x01E0 =0x0120 sep
>2 uleshort&0x01E0 =0x0140 oct
>2 uleshort&0x01E0 =0x0160 nov
>2 uleshort&0x01E0 =0x0180 dec
# year part
# (upper 7 bits; printed as offset to 1980, not as calendar year)
>2 uleshort/512 x 1980+%u
#
# ExcelBIFF2-8BOF.magic - Excel Binary Interchange File Format versions 2-8
# Beginning of File records
# See https://www.gaia-gis.it/gaia-sins/freexl-1.0.6-doxy-doc/html/Format.html
# Excel Commercial BIFF Release
# Version Name Version Year Notes
# 2.x Excel 2.0 BIFF2 1987 Before CFBF. File is the BIFF
# stream, containing a single
# worksheet.
# 3.0 Excel 3.0 BIFF3 1990 ""
# 4.0 Excel 4.0 BIFF4 1992 ""
# 5.0 Excel 5.0 BIFF5 1993 Starting with BIFF5, a single
# Workbook can internally store
# many individual Worksheets.
# The BIFF stream is stored in
# the CFBF file container.
# 7.0 Excel 95 BIFF5 1995
# 8.0 Excel 98 BIFF8 1998
# 9.0 Excel 2000 BIFF8 1999
# 10.0 Excel XP BIFF8 2001
# 11.0 Excel 2003 BIFF8 2003
# See https://www.openoffice.org/sc/excelfileformat.pdf#page=135
# 5.8 BOF Beginning of File
# See also https://en.wikipedia.org/wiki/Microsoft_Excel;
# Old file extensions
# Format Extension Description
# Spreadsheet .xls Main spreadsheet format which holds data in
# worksheets, charts, and macros
# Add-in (VBA) .xla Adds custom functionality; written in VBA
# Toolbar .xlb The file extension where Microsoft Excel custom
# toolbar settings are stored.
# Chart .xlc A chart created with data from a Microsoft Excel
# spreadsheet that only saves the chart.
# To save the chart and spreadsheet save as .XLS.
# XLC is not supported in Excel 2007 or in any
# newer versions of Excel.
# Dialog .xld Used in older versions of Excel.
# Archive .xlk A backup of an Excel Spreadsheet
# Add-in (DLL) .xll Adds custom functionality; written in C++/C,
# Fortran, etc. and compiled in to a special
# dynamic-link library
# Macro .xlm A macro is created by the user or pre-installed
# with Excel.
# Template .xlt A pre-formatted spreadsheet created by the user
# or by Microsoft Excel.
# Module .xlv A module is written in VBA (Visual Basic for
# Applications) for Microsoft Excel
# Workspace .xlw Arrangement of the windows of multiple Workbooks
# Library .DLL Code written in VBA may access functions in a
# DLL, typically this is used to access the
# Windows API
#!:ext xls/xla/xlb/xlc/xld/xlk/xll/xlm/xlt/xlv/xlw
#!:mime application/vnd.ms-excel
# 5.8.1 BOF Records Written by Excel
# Record BOF, BIFF2 (record identifier is 0009 H):
# Offset Size Contents
# 0 2 BIFF version (not used)
# 2 2 Type of the following data: 0010H = Sheet
# 0020H = Chart
# 0040H = Macro sheet
# e.g. 0x0009 BOF len 4 version 2 content 0x0010 Sheet
0 uleshort =0x0009 Excel 2 BIFF 2
# record length of a BIFF2 BOF is 4
>2 uleshort =4
# version: 0 and 2 are accepted.
# A continuation line is only evaluated if the directly preceding line of
# the next lower level matched. The data type tests are therefore repeated
# below each accepted version value; placed only once after the last
# alternative they would never be reached for the other value.
>>4 uleshort =0
>>>6 uleshort =0x0010 Sheet
>>>6 uleshort =0x0020 Chart
>>>6 uleshort =0x0040 Macros
>>4 uleshort =2
>>>6 uleshort =0x0010 Sheet
>>>6 uleshort =0x0020 Chart
>>>6 uleshort =0x0040 Macros
# Record BOF, BIFF3 (record identifier is 0209 H) and
# BIFF4 (record identifier is 0409H):
# Offset Size Contents
# 0 2 BIFF version (not used)
# 2 2 Type of the following data: 0010H = Sheet
# 0020H = Chart
# 0040H = Macro sheet
# 0100H = Workspace
# (BIFF3W/BIFF4W only)
# 4 2 Not used
0 uleshort =0x0209 Excel 3 BIFF 3
# record length of a BIFF3 BOF is 6
>2 uleshort =6
# version: 0 and 3 are accepted.
# A continuation line is only evaluated if the directly preceding line of
# the next lower level matched, so the data type tests are repeated below
# each accepted version value.
>>4 uleshort =0
>>>6 uleshort =0x0010 Sheet
>>>6 uleshort =0x0020 Chart
>>>6 uleshort =0x0040 Macros
# (BIFF3W only)
>>>6 uleshort =0x0100 Workspace
>>4 uleshort =3
>>>6 uleshort =0x0010 Sheet
>>>6 uleshort =0x0020 Chart
>>>6 uleshort =0x0040 Macros
# (BIFF3W only)
>>>6 uleshort =0x0100 Workspace
0 uleshort =0x0409 Excel 4 BIFF 4
# record length of a BIFF4 BOF is 6
>2 uleshort =6
# version: 0 and 4 are accepted; data type tests repeated as for BIFF3
>>4 uleshort =0
>>>6 uleshort =0x0010 Sheet
>>>6 uleshort =0x0020 Chart
>>>6 uleshort =0x0040 Macros
# (BIFF4W only)
>>>6 uleshort =0x0100 Workspace
>>4 uleshort =4
>>>6 uleshort =0x0010 Sheet
>>>6 uleshort =0x0020 Chart
>>>6 uleshort =0x0040 Macros
# (BIFF4W only)
>>>6 uleshort =0x0100 Workspace
# Record BOF, BIFF5 (record identifier is 0809 H):
# Offset Size Contents
# 0 2 BIFF version (always 0500H for BIFF5).
# Should only be used, if this record is the leading
# workbook globals BOF (see above).
# 2 2 Type of the following data:
# 0005H = Workbook globals
# 0006H = Visual Basic module
# 0010H = Sheet or dialogue (see SHEETPR,
# ➜5.97)
# 0020H = Chart
# 0040H = Macro sheet
# 0100H = Workspace (BIFF5W only)
# 4 2 Build identifier, must not be 0
# 6 2 Build year
# The record identifier 0x0809 is also used by BIFF8 and by BOF records of
# external tools. The description is therefore printed only after record
# length and version have been checked; printed on the first line it would
# label every such file as BIFF5 and keep the other 0x0809 tests from being
# tried.
0 uleshort =0x0809
# record length of a BIFF5 BOF is 8
>2 uleshort =8
# version: 0x0500, 5 and 0 are accepted.
# A continuation line is only evaluated if the directly preceding line of
# the next lower level matched, so every accepted value calls the shared
# subroutine itself.
>>4 uleshort =0x0500 Excel 5 BIFF 5
>>>0 use excel-biff5-bof
>>4 uleshort =5 Excel 5 BIFF 5
>>>0 use excel-biff5-bof
>>4 uleshort =0 Excel 5 BIFF 5
>>>0 use excel-biff5-bof
# display data type, build identifier and build year of a BIFF5 BOF record;
# called with the offset of the record start
0 name excel-biff5-bof
>6 uleshort =0x0005 Workbook Globals
>6 uleshort =0x0006 VB Module
>6 uleshort =0x0010 Sheet
>6 uleshort =0x0020 Chart
>6 uleshort =0x0040 Macros
# (BIFF5W only)
>6 uleshort =0x0100 Workspace
# build identifier and year are shown for every data type
>8 uleshort >0 Build %d
>>10 uleshort >1900 Year %d
# Record BOF, BIFF8 (record identifier is 0809 H):
# Offset Size Contents
# 0 2 BIFF version (always 0600 H for BIFF8)
# 2 2 Type of the following data:
# 0005H = Workbook globals
# 0006H = Visual Basic module
# 0010H = Sheet or dialogue (see SHEETPR,
# ➜5.97)
# 0020H = Chart
# 0040H = Macro sheet
# 0100H = Workspace (BIFF8W only)
# 4 2 Build identifier, must not be 0
# 6 2 Build year, must not be 0
# 8 4 File history flags
# 12 4 Lowest Excel version that can read all records in this
# file
# The record identifier 0x0809 is also used by BIFF5 and by BOF records of
# external tools. The description is therefore printed only after record
# length and version have been checked instead of on the first line.
0 uleshort =0x0809
# record length of a BIFF8 BOF is 16
>2 uleshort =16
# version: 0x0600, 8 and 0 are accepted.
# A continuation line is only evaluated if the directly preceding line of
# the next lower level matched, so every accepted value calls the shared
# subroutine itself.
>>4 uleshort =0x0600 Excel 8 BIFF 8
>>>0 use excel-biff8-bof
>>4 uleshort =8 Excel 8 BIFF 8
>>>0 use excel-biff8-bof
>>4 uleshort =0 Excel 8 BIFF 8
>>>0 use excel-biff8-bof
# display data type, build, year, file history flags and lowest Excel
# version of a BIFF8 BOF record; called with the offset of the record start
0 name excel-biff8-bof
>6 uleshort =0x0005 Workbook Globals
>6 uleshort =0x0006 VB Module
>6 uleshort =0x0010 Sheet
>6 uleshort =0x0020 Chart
>6 uleshort =0x0040 Macros
# (BIFF8W only)
>6 uleshort =0x0100 Workspace
# build identifier and following fields are shown for every data type
>8 uleshort >0 Build %d
>>10 uleshort >1900 Year %d
>>>12 ulelong !0 File history %d
>>>16 ulelong >0 Excel version needed %d
# 5.8.2 BOF Records Written by Other External Tools
# Various external tools write non-standard BOF records with the record
# identifier 0809H (determining a BIFF5-BIFF8 BOF record), but with a
# different BIFF version field. In this case, the record identifier is
# ignored, and only the version field is used to set the BIFF version of
# the workbook.
# Record BOF (record identifier is 0809 H):
# Offset Size Contents
# 0 2 BIFF version: 0000H = BIFF5
# 0200H = BIFF2
# 0300H = BIFF3
# 0400H = BIFF4
# 0500H = BIFF5
# 0600H = BIFF8
# 2 2 Type of the following data:
# 0005H = Workbook globals
# 0006H = Visual Basic module
# 0010H = Sheet or dialogue (see SHEETPR,
# ➜5.97)
# 0020H = Chart
# 0040H = Macro sheet
# 0100H = Workspace
# [4] var. (optional) Additional fields of a BOF record,
# should be ignored
0 uleshort =0x0809
# >= 4
>2 uleshort >3
# version field decides about the reported BIFF version.
# A continuation line is only evaluated if the directly preceding line of
# the next lower level matched, so every accepted value calls the data type
# subroutine itself; attached only to the last alternative the data type
# would be shown for that single value alone.
>>4 uleshort =0 Excel 5 BIFF 5
>>>0 use excel-bof-type
>>4 uleshort =0x0200 Excel 2 BIFF 2
>>>0 use excel-bof-type
>>4 uleshort =2 Excel 2 BIFF 2
>>>0 use excel-bof-type
>>4 uleshort =0x0300 Excel 3 BIFF 3
>>>0 use excel-bof-type
>>4 uleshort =3 Excel 3 BIFF 3
>>>0 use excel-bof-type
>>4 uleshort =0x0400 Excel 4 BIFF 4
>>>0 use excel-bof-type
>>4 uleshort =4 Excel 4 BIFF 4
>>>0 use excel-bof-type
>>4 uleshort =0x0500 Excel 5 BIFF 5
>>>0 use excel-bof-type
>>4 uleshort =5 Excel 5 BIFF 5
>>>0 use excel-bof-type
>>4 uleshort =0x0600 Excel 8 BIFF 8
>>>0 use excel-bof-type
>>4 uleshort =6 Excel 8 BIFF 8
>>>0 use excel-bof-type
>>4 uleshort =0x0800 Excel 8 BIFF 8
>>>0 use excel-bof-type
>>4 uleshort =8 Excel 8 BIFF 8
>>>0 use excel-bof-type
# display type of the data following a BOF record written by external tools;
# called with the offset of the record start
0 name excel-bof-type
>6 uleshort =0x0005 Workbook Globals
>6 uleshort =0x0006 VB Module
>6 uleshort =0x0010 Sheet/Dialogue
>6 uleshort =0x0020 Chart
>6 uleshort =0x0040 Macros
# (BIFF8W only)
>6 uleshort =0x0100 Workspace