#!/usr/local/bin/perl
# --- magicdata.pl
# scan the "magic" file for file identification rules
$filename = ($#ARGV>=0) ? $ARGV[0] : 'magic';
open(FILE,"<$filename") || die "Couldn't open file '$filename'";
$i = 0;
while (<FILE>)
{
next if /^\s*#/;# skip comments
next if /^\s*$/;# skip blank lines
s/[\r\n]*//g; # strip trailing cr/lf
# replace octal escape codes
s/\\([0-9]{3})/pack('C',oct($1))/eg;
# split on spaces, except for "\ "
my ($offset,$dt,$cnt,$mime,$encoding) = split(/(?<!\\)\s+/);
$cont = ($offset =~ /^>/) ? 'Y' : undef;
$offset = substr($offset,1) if $cont;
if ($dteq 'string')
{
# generate a HEXTORAW version of the string
$data = join('',map(sprintf('%02X',$_),unpack('C*',$cnt)));
}
else
{
# handle special number formats
if ($cnt =~ /^0x/) { $cnt = hex($cnt); }# hex
elsif ($cnt =~ /^0/) { $cnt = oct($cnt); } # octal
warn "unknown number: '$cnt'" unless $cnt =~ /^([0-9]|[1-9][0-9]*)$/;
if ($dteq 'belong') {
$data = sprintf('%02X' x 4,unpack('C4',pack('N',$cnt)));
} elsif ($dteq 'lelong') {
$data = sprintf('%02X' x 4,unpack('C4',pack('V',$cnt)));
} elsif ($dteq 'beshort' || $dteq 'short') {
$data = sprintf('%02X' x 2,unpack('C2',pack('n',$cnt)));
} elsif ($dteq 'leshort') {
$data = sprintf('%02X' x 2,unpack('C2',pack('v',$cnt)));
} elsif ($dteq 'byte') {
$data = sprintf('%02X',$cnt);
} else {
warn "data type '$dt' not implemented";
}
}
$i++;
print join(',',$i,$cont,$offset,$data,$mime,$encoding),"\n";
}
close(FILE);
$ perl magicdata.pl $ORACLE_HOME/Apache/conf/magic > magicdata.dat |