Chilkat HOME Android™ AutoIt C C# C++ Chilkat2-Python CkPython Classic ASP DataFlex Delphi DLL Go Java Node.js Objective-C PHP Extension Perl PowerBuilder PowerShell PureBasic Ruby SQL Server Swift Tcl Unicode C Unicode C++ VB.NET VBScript Visual Basic 6.0 Visual FoxPro Xojo Plugin
(Perl) Determine File Type from Binary Content of FileNote: This example requires Chilkat v9.5.0.64 or later. Many file types have "signatures" (leading bytes) that signify the type of file. It allows for programs to identify the likely type of file given the first few bytes contained within the file. This example shows how to identify a few common types files. For other file types, you can do a short bit of investigative work by examining the first few bytes of an sample file, and searching the Internet for information about the file type. Use this same technique for handling other file types that have leading "signature" bytes.
use chilkat(); # Note: This example requires Chilkat v9.5.0.64 or later. # To identify a file by the first few bytes, we'll load a few bytes from the start # of the file, and then examine the bytes as both hex and quoted-printable. $fac = chilkat::CkFileAccess->new(); # A JPG file. $jpgData = chilkat::CkBinData->new(); $fac->OpenForRead("qa_data/jpg/starfish.jpg"); # The the first 8 bytes of the JPG file. $fac->FileReadBd(8,$jpgData); $fac->FileClose(); # JPG hex: FFD8FFE000104A46 # JPG qp: =FF=D8=FF=E0=00=10JF print "JPG hex: " . $jpgData->getEncoded("hex") . "\r\n"; print "JPG qp: " . $jpgData->getEncoded("qp") . "\r\n"; # A JPG begins with the following two bytes: 0xFF, 0xD8 # Your program can check to see if the hex string begins with "FFD8", or if the qp string begins with "=FF=D8". # ---------------------------------------- # A PNG file. $pngData = chilkat::CkBinData->new(); $fac->OpenForRead("qa_data/png/anemone.png"); # The the first 8 bytes of the PNG file. $fac->FileReadBd(8,$pngData); $fac->FileClose(); # PNG hex: 89504E470D0A1A0A # PNG qp: =89PNG=1A=0A print "PNG hex: " . $pngData->getEncoded("hex") . "\r\n"; print "PNG qp: " . $pngData->getEncoded("qp") . "\r\n"; # A PNG file begins with the byte 0x89, followed by the us-ascii bytes "PNG". # ---------------------------------------- # A PDF file. $pdfData = chilkat::CkBinData->new(); $fac->OpenForRead("qa_data/pdf/fishing.pdf"); # The the first 8 bytes of the PDF file. $fac->FileReadBd(8,$pdfData); $fac->FileClose(); # PDF hex: 255044462D312E33 # PDF qp: %PDF-1.3 print "PDF hex: " . $pdfData->getEncoded("hex") . "\r\n"; print "PDF qp: " . $pdfData->getEncoded("qp") . "\r\n"; # A PDF file begins with the us-ascii chars "%PDF" # ---------------------------------------- # A Zip file. $zipData = chilkat::CkBinData->new(); $fac->OpenForRead("qa_data/zips/test.zip"); # The the first 8 bytes of the Zip file. $fac->FileReadBd(8,$zipData); $fac->FileClose(); # PDF hex: 504B030414000000 # PDF qp: PK=03=04=14=00=00=00 print "PDF hex: " . $zipData->getEncoded("hex") . "\r\n"; print "PDF qp: " . $zipData->getEncoded("qp") . "\r\n"; # A Zip archive begins with the us-ascii chars "PK" followed by the bytes 0x03, 0x04. |
© 2000-2025 Chilkat Software, Inc. All Rights Reserved.