[3318] | 1 | <?php |
---|
| 2 | // +----------------------------------------------------------------------+ |
---|
| 3 | // | PHP version 5 | |
---|
| 4 | // +----------------------------------------------------------------------+ |
---|
| 5 | // | Copyright (c) 2002-2006 James Heinrich, Allan Hansen | |
---|
| 6 | // +----------------------------------------------------------------------+ |
---|
| 7 | // | This source file is subject to version 2 of the GPL license, | |
---|
| 8 | // | that is bundled with this package in the file license.txt and is | |
---|
| 9 | // | available through the world-wide-web at the following url: | |
---|
| 10 | // | http://www.gnu.org/copyleft/gpl.html | |
---|
| 11 | // +----------------------------------------------------------------------+ |
---|
| 12 | // | getID3() - http://getid3.sourceforge.net or http://www.getid3.org | |
---|
| 13 | // +----------------------------------------------------------------------+ |
---|
| 14 | // | Authors: James Heinrich <infoØgetid3*org> | |
---|
| 15 | // | Allan Hansen <ahØartemis*dk> | |
---|
| 16 | // +----------------------------------------------------------------------+ |
---|
| 17 | // | module.archive.gzip.php | |
---|
| 18 | // | module for analyzing GZIP files | |
---|
| 19 | // | dependencies: PHP compiled with zlib support (optional) | |
---|
| 20 | // +----------------------------------------------------------------------+ |
---|
| 21 | // | Module originally written by Mike Mozolin <teddybearØmail*ru> | |
---|
| 22 | // +----------------------------------------------------------------------+ |
---|
| 23 | // |
---|
| 24 | // $Id: module.archive.gzip.php 3318 2009-05-20 21:54:10Z vdigital $ |
---|
| 25 | |
---|
| 26 | |
---|
| 27 | |
---|
class getid3_gzip extends getid3_handler
{

    // public: Optional file list - disable for speed.
    public $option_gzip_parse_contents = true; // decode gzipped files, if possible, and parse recursively (.tar.gz for example)


    /**
     * Reads the gzip file.
     *
     * Splits the file into gzip members, decodes every member header into
     * $info['gzip']['member_header'][1..n] and, when
     * $option_gzip_parse_contents is enabled and zlib is available, inflates
     * each member and analyzes the inflated data with a clone of the getid3
     * object.
     *
     * @return bool true on success, false when a member header is unreadable
     *              (an entry is then appended to $info['error'])
     *
     * @throws getid3_exception when no temporary file can be created
     */
    public function Analyze() {

        $info = &$this->getid3->info;

        $info['fileformat'] = 'gzip';

        //+---+---+---+---+---+---+---+---+---+---+
        //|ID1|ID2|CM |FLG|     MTIME     |XFL|OS |
        //+---+---+---+---+---+---+---+---+---+---+
        $header_length = 10;

        @fseek($this->getid3->fp, 0);
        $buffer = @fread($this->getid3->fp, $info['filesize']);

        $members = self::split_members((string) $buffer);

        // Decide once whether member contents can be inflated, so that a missing
        // zlib extension does not stop the header parsing of later members.
        $parse_contents = $this->option_gzip_parse_contents;
        if ($parse_contents && $members && !function_exists('gzinflate')) {
            $this->getid3->warning('PHP does not have zlib support - contents not parsed.');
            $parse_contents = false;
        }

        $idx = 0;
        foreach ($members as $buff) {

            if (strlen($buff) < $header_length) {
                $info['error'][] = 'Read error on gzip file';
                return false;
            }

            // Member headers are numbered from 1.
            $member = &$info['gzip']['member_header'][++$idx];

            $member['filemtime']      = getid3_lib::LittleEndian2Int(substr($buff, 4, 4));
            $member['raw']['id1']     = ord($buff[0]);
            $member['raw']['id2']     = ord($buff[1]);
            $member['raw']['cmethod'] = ord($buff[2]);
            $member['raw']['os']      = ord($buff[9]);
            $member['raw']['xflags']  = ord($buff[8]);
            $member['raw']['flags']   = ord($buff[3]);

            $member['flags']['crc16']    = (bool) ($member['raw']['flags'] & 0x02);
            $member['flags']['extra']    = (bool) ($member['raw']['flags'] & 0x04);
            $member['flags']['filename'] = (bool) ($member['raw']['flags'] & 0x08);
            $member['flags']['comment']  = (bool) ($member['raw']['flags'] & 0x10);

            $member['compression'] = self::get_xflag_type($member['raw']['xflags']);

            $member['os'] = self::get_os_type($member['raw']['os']);
            if ($member['os'] === null) {
                $info['error'][] = 'Read error on gzip file';
                return false;
            }

            $fpointer = $header_length;

            // bit 2 - FLG.FEXTRA
            //+---+---+=================================+
            //| XLEN  |...XLEN bytes of "extra field"...|
            //+---+---+=================================+
            // The extra field is stored raw; its SI1/SI2/LEN subfields are not decoded.

            if ($member['flags']['extra']) {
                $xlen = getid3_lib::LittleEndian2Int((string) substr($buff, $fpointer, 2));
                $fpointer += 2;

                $member['raw']['xfield'] = (string) substr($buff, $fpointer, $xlen);
                $fpointer += $xlen;
            }

            // bit 3 - FLG.FNAME
            //+=========================================+
            //|...original file name, zero-terminated...|
            //+=========================================+
            // GZIP files may have only one file, with no filename, so assume original filename is current filename without .gz

            $member['filename'] = preg_replace('/\.gz$/i', '', isset($info['filename']) ? $info['filename'] : '');
            if ($member['flags']['filename']) {
                // The stored name replaces the guessed one.
                $member['filename'] = self::read_zero_terminated($buff, $fpointer);
                $fpointer += strlen($member['filename']) + 1;
            }

            // bit 4 - FLG.FCOMMENT
            //+===================================+
            //|...file comment, zero-terminated...|
            //+===================================+

            if ($member['flags']['comment']) {
                $member['comment'] = self::read_zero_terminated($buff, $fpointer);
                $fpointer += strlen($member['comment']) + 1;
            }

            // bit 1 - FLG.FHCRC
            //+---+---+
            //| CRC16 |
            //+---+---+

            if ($member['flags']['crc16']) {
                $member['crc16'] = getid3_lib::LittleEndian2Int((string) substr($buff, $fpointer, 2));
                $fpointer += 2;
            }

            // bit 0 - FLG.FTEXT is ignored
            // bits 5, 6, 7 - reserved

            // Member trailer: CRC32 and uncompressed size are the last 8 bytes.
            $member['crc32']    = getid3_lib::LittleEndian2Int(substr($buff, -8, 4));
            $member['filesize'] = getid3_lib::LittleEndian2Int(substr($buff, -4));

            if (!$parse_contents) {
                continue;
            }

            // Compressed data sits between the header and the 8 byte trailer.
            $cdata = (string) substr($buff, $fpointer, -8);

            // gzinflate() raises a PHP warning on corrupt data; failure is handled through its return value.
            $inflated = @gzinflate($cdata);
            if ($inflated === false) {
                $member['crc32_valid'] = false;
                continue;
            }

            // Calculate CRC32 for inflated content
            $member['crc32_valid'] = (bool) (sprintf('%u', crc32($inflated)) == $member['crc32']);

            $parsed = $this->analyze_inflated($inflated);
            if ($parsed !== null) {
                $member['parsed_content'] = $parsed;
            }
        }
        unset($member);

        return true;
    }


    /**
     * Splits a raw gzip file into its members.
     *
     * The buffer is cut at every occurrence of the magic bytes 1F 8B 08. A
     * fragment whose header is too short or carries an unknown OS byte is
     * treated as a false positive (magic bytes inside compressed data) and is
     * glued back onto the preceding member, magic bytes included.
     *
     * @param string $buffer complete file contents
     *
     * @return array list of member strings, each starting with the magic bytes
     */
    private static function split_members($buffer) {
        $magic = "\x1F\x8B\x08";

        $fragments = explode($magic, $buffer);

        // Whatever precedes the first magic is not part of any member.
        array_shift($fragments);

        $members = array();
        $last    = -1;
        foreach ($fragments as $fragment) {
            $candidate = $magic.$fragment;

            $plausible = (strlen($candidate) >= 10) && (self::get_os_type(ord($candidate[9])) !== null);
            if (($last >= 0) && !$plausible) {
                $members[$last] .= $candidate;
            } else {
                // The first candidate is always kept; Analyze() reports it if its header is invalid.
                $members[++$last] = $candidate;
            }
        }
        return $members;
    }


    /**
     * Returns the zero-terminated string starting at $offset, without the terminator.
     *
     * When no terminator exists the remainder of the buffer is returned; when
     * $offset lies outside the buffer an empty string is returned.
     *
     * @param string $buff   member data
     * @param int    $offset position of the first byte of the string
     *
     * @return string
     */
    private static function read_zero_terminated($buff, $offset) {
        if ($offset >= strlen($buff)) {
            return '';
        }
        $end = strpos($buff, "\x00", $offset);
        if ($end === false) {
            return (string) substr($buff, $offset);
        }
        return (string) substr($buff, $offset, $end - $offset);
    }


    /**
     * Writes inflated member data to a temporary file and analyzes it with a
     * clone of the getid3 object. The temporary file is always removed.
     *
     * @param string $inflated inflated member contents
     *
     * @return mixed the clone's info after a successful analysis, null otherwise
     *
     * @throws getid3_exception when no temporary file can be created
     */
    private function analyze_inflated($inflated) {
        if (($temp_file_name = tempnam(sys_get_temp_dir(), 'getID3')) === false) {
            throw new getid3_exception('Unable to create temporary file.');
        }

        $parsed = null;

        if ($tmp = fopen($temp_file_name, 'wb')) {
            fwrite($tmp, $inflated);
            fclose($tmp);

            // clone getid3 - we want same settings
            $clone = clone $this->getid3;
            // Analyze() holds a reference to the original's info; drop the property on
            // the clone before analyzing the inflated data.
            unset($clone->info);
            try {
                $clone->Analyze($temp_file_name);
                $parsed = $clone->info;
            }
            catch (getid3_exception $e) {
                // unable to parse contents
            }
            catch (Exception $e) {
                // Anything else is not ours to handle, but do not leave the file behind.
                unlink($temp_file_name);
                throw $e;
            }
        }

        unlink($temp_file_name);

        return $parsed;
    }


    /**
     * Converts the OS type byte of a member header to a description.
     *
     * @param int $key OS byte
     *
     * @return string|null description, or null when the value is not in the table
     */
    public static function get_os_type($key) {
        static $os_type = array (
            '0'   => 'FAT filesystem (MS-DOS, OS/2, NT/Win32)',
            '1'   => 'Amiga',
            '2'   => 'VMS (or OpenVMS)',
            '3'   => 'Unix',
            '4'   => 'VM/CMS',
            '5'   => 'Atari TOS',
            '6'   => 'HPFS filesystem (OS/2, NT)',
            '7'   => 'Macintosh',
            '8'   => 'Z-System',
            '9'   => 'CP/M',
            '10'  => 'TOPS-20',
            '11'  => 'NTFS filesystem (NT)',
            '12'  => 'QDOS',
            '13'  => 'Acorn RISCOS',
            '255' => 'unknown'
        );
        return isset($os_type[$key]) ? $os_type[$key] : null;
    }


    /**
     * Converts the eXtra FLags byte of a member header to a description.
     *
     * @param int $key XFL byte
     *
     * @return string|null description, or null when the value is not in the table
     */
    public static function get_xflag_type($key) {
        static $xflag_type = array (
            '0' => 'unknown',
            '2' => 'maximum compression',
            '4' => 'fastest algorithm'
        );
        return isset($xflag_type[$key]) ? $xflag_type[$key] : null;
    }

}
---|
| 295 | |
---|
| 296 | ?> |
---|