<?php
/**
 * MacBinary signature checker and data fork extractor, for files
 * uploaded from Internet Explorer for Mac.
 *
 * Copyright (C) 2005 Brion Vibber <brion@pobox.com>
 * Portions based on Convert::BinHex by Eryq et al
 * http://www.mediawiki.org/
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @ingroup SpecialPage
 */
  27. class MacBinary {
  28. function __construct( $filename ) {
  29. $this->open( $filename );
  30. $this->loadHeader();
  31. }
  32. /**
  33. * The file must be seekable, such as local filesystem.
  34. * Remote URLs probably won't work.
  35. *
  36. * @param string $filename
  37. */
  38. function open( $filename ) {
  39. $this->valid = false;
  40. $this->version = 0;
  41. $this->filename = '';
  42. $this->dataLength = 0;
  43. $this->resourceLength = 0;
  44. $this->handle = fopen( $filename, 'rb' );
  45. }
  46. /**
  47. * Does this appear to be a valid MacBinary archive?
  48. * @return bool
  49. */
  50. function isValid() {
  51. return $this->valid;
  52. }
  53. /**
  54. * Get length of data fork
  55. * @return int
  56. */
  57. function dataForkLength() {
  58. return $this->dataLength;
  59. }
  60. /**
  61. * Copy the data fork to an external file or resource.
  62. * @param resource $destination
  63. * @return bool
  64. */
  65. function extractData( $destination ) {
  66. if( !$this->isValid() ) {
  67. return false;
  68. }
  69. // Data fork appears immediately after header
  70. fseek( $this->handle, 128 );
  71. return $this->copyBytesTo( $destination, $this->dataLength );
  72. }
  73. /**
  74. *
  75. */
  76. function close() {
  77. fclose( $this->handle );
  78. }
  79. // --------------------------------------------------------------
  80. /**
  81. * Check if the given file appears to be MacBinary-encoded,
  82. * as Internet Explorer on Mac OS may provide for unknown types.
  83. * http://www.lazerware.com/formats/macbinary/macbinary_iii.html
  84. * If ok, load header data.
  85. *
  86. * @return bool
  87. * @access private
  88. */
  89. function loadHeader() {
  90. $fname = 'MacBinary::loadHeader';
  91. fseek( $this->handle, 0 );
  92. $head = fread( $this->handle, 128 );
  93. #$this->hexdump( $head );
  94. if( strlen( $head ) < 128 ) {
  95. wfDebug( "$fname: couldn't read full MacBinary header\n" );
  96. return false;
  97. }
  98. if( $head{0} != "\x00" || $head{74} != "\x00" ) {
  99. wfDebug( "$fname: header bytes 0 and 74 not null\n" );
  100. return false;
  101. }
  102. $signature = substr( $head, 102, 4 );
  103. $a = unpack( "ncrc", substr( $head, 124, 2 ) );
  104. $storedCRC = $a['crc'];
  105. $calculatedCRC = $this->calcCRC( substr( $head, 0, 124 ) );
  106. if( $storedCRC == $calculatedCRC ) {
  107. if( $signature == 'mBIN' ) {
  108. $this->version = 3;
  109. } else {
  110. $this->version = 2;
  111. }
  112. } else {
  113. $crc = sprintf( "%x != %x", $storedCRC, $calculatedCRC );
  114. if( $storedCRC == 0 && $head{82} == "\x00" &&
  115. substr( $head, 101, 24 ) == str_repeat( "\x00", 24 ) ) {
  116. wfDebug( "$fname: no CRC, looks like MacBinary I\n" );
  117. $this->version = 1;
  118. } elseif( $signature == 'mBIN' && $storedCRC == 0x185 ) {
  119. // Mac IE 5.0 seems to insert this value in the CRC field.
  120. // 5.2.3 works correctly; don't know about other versions.
  121. wfDebug( "$fname: CRC doesn't match ($crc), looks like Mac IE 5.0\n" );
  122. $this->version = 3;
  123. } else {
  124. wfDebug( "$fname: CRC doesn't match ($crc) and not MacBinary I\n" );
  125. return false;
  126. }
  127. }
  128. $nameLength = ord( $head{1} );
  129. if( $nameLength < 1 || $nameLength > 63 ) {
  130. wfDebug( "$fname: invalid filename size $nameLength\n" );
  131. return false;
  132. }
  133. $this->filename = substr( $head, 2, $nameLength );
  134. $forks = unpack( "Ndata/Nresource", substr( $head, 83, 8 ) );
  135. $this->dataLength = $forks['data'];
  136. $this->resourceLength = $forks['resource'];
  137. $maxForkLength = 0x7fffff;
  138. if( $this->dataLength < 0 || $this->dataLength > $maxForkLength ) {
  139. wfDebug( "$fname: invalid data fork length $this->dataLength\n" );
  140. return false;
  141. }
  142. if( $this->resourceLength < 0 || $this->resourceLength > $maxForkLength ) {
  143. wfDebug( "$fname: invalid resource fork size $this->resourceLength\n" );
  144. return false;
  145. }
  146. wfDebug( "$fname: appears to be MacBinary $this->version, data length $this->dataLength\n" );
  147. $this->valid = true;
  148. return true;
  149. }
  150. /**
  151. * Calculate a 16-bit CRC value as for MacBinary headers.
  152. * Adapted from perl5 Convert::BinHex by Eryq,
  153. * based on the mcvert utility (Doug Moore, April '87),
  154. * with magic array thingy by Jim Van Verth.
  155. * http://search.cpan.org/~eryq/Convert-BinHex-1.119/lib/Convert/BinHex.pm
  156. *
  157. * @param string $data
  158. * @param int $seed
  159. * @return int
  160. * @access private
  161. */
  162. function calcCRC( $data, $seed = 0 ) {
  163. # An array useful for CRC calculations that use 0x1021 as the "seed":
  164. $MAGIC = array(
  165. 0x0000, 0x1021, 0x2042, 0x3063, 0x4084, 0x50a5, 0x60c6, 0x70e7,
  166. 0x8108, 0x9129, 0xa14a, 0xb16b, 0xc18c, 0xd1ad, 0xe1ce, 0xf1ef,
  167. 0x1231, 0x0210, 0x3273, 0x2252, 0x52b5, 0x4294, 0x72f7, 0x62d6,
  168. 0x9339, 0x8318, 0xb37b, 0xa35a, 0xd3bd, 0xc39c, 0xf3ff, 0xe3de,
  169. 0x2462, 0x3443, 0x0420, 0x1401, 0x64e6, 0x74c7, 0x44a4, 0x5485,
  170. 0xa56a, 0xb54b, 0x8528, 0x9509, 0xe5ee, 0xf5cf, 0xc5ac, 0xd58d,
  171. 0x3653, 0x2672, 0x1611, 0x0630, 0x76d7, 0x66f6, 0x5695, 0x46b4,
  172. 0xb75b, 0xa77a, 0x9719, 0x8738, 0xf7df, 0xe7fe, 0xd79d, 0xc7bc,
  173. 0x48c4, 0x58e5, 0x6886, 0x78a7, 0x0840, 0x1861, 0x2802, 0x3823,
  174. 0xc9cc, 0xd9ed, 0xe98e, 0xf9af, 0x8948, 0x9969, 0xa90a, 0xb92b,
  175. 0x5af5, 0x4ad4, 0x7ab7, 0x6a96, 0x1a71, 0x0a50, 0x3a33, 0x2a12,
  176. 0xdbfd, 0xcbdc, 0xfbbf, 0xeb9e, 0x9b79, 0x8b58, 0xbb3b, 0xab1a,
  177. 0x6ca6, 0x7c87, 0x4ce4, 0x5cc5, 0x2c22, 0x3c03, 0x0c60, 0x1c41,
  178. 0xedae, 0xfd8f, 0xcdec, 0xddcd, 0xad2a, 0xbd0b, 0x8d68, 0x9d49,
  179. 0x7e97, 0x6eb6, 0x5ed5, 0x4ef4, 0x3e13, 0x2e32, 0x1e51, 0x0e70,
  180. 0xff9f, 0xefbe, 0xdfdd, 0xcffc, 0xbf1b, 0xaf3a, 0x9f59, 0x8f78,
  181. 0x9188, 0x81a9, 0xb1ca, 0xa1eb, 0xd10c, 0xc12d, 0xf14e, 0xe16f,
  182. 0x1080, 0x00a1, 0x30c2, 0x20e3, 0x5004, 0x4025, 0x7046, 0x6067,
  183. 0x83b9, 0x9398, 0xa3fb, 0xb3da, 0xc33d, 0xd31c, 0xe37f, 0xf35e,
  184. 0x02b1, 0x1290, 0x22f3, 0x32d2, 0x4235, 0x5214, 0x6277, 0x7256,
  185. 0xb5ea, 0xa5cb, 0x95a8, 0x8589, 0xf56e, 0xe54f, 0xd52c, 0xc50d,
  186. 0x34e2, 0x24c3, 0x14a0, 0x0481, 0x7466, 0x6447, 0x5424, 0x4405,
  187. 0xa7db, 0xb7fa, 0x8799, 0x97b8, 0xe75f, 0xf77e, 0xc71d, 0xd73c,
  188. 0x26d3, 0x36f2, 0x0691, 0x16b0, 0x6657, 0x7676, 0x4615, 0x5634,
  189. 0xd94c, 0xc96d, 0xf90e, 0xe92f, 0x99c8, 0x89e9, 0xb98a, 0xa9ab,
  190. 0x5844, 0x4865, 0x7806, 0x6827, 0x18c0, 0x08e1, 0x3882, 0x28a3,
  191. 0xcb7d, 0xdb5c, 0xeb3f, 0xfb1e, 0x8bf9, 0x9bd8, 0xabbb, 0xbb9a,
  192. 0x4a75, 0x5a54, 0x6a37, 0x7a16, 0x0af1, 0x1ad0, 0x2ab3, 0x3a92,
  193. 0xfd2e, 0xed0f, 0xdd6c, 0xcd4d, 0xbdaa, 0xad8b, 0x9de8, 0x8dc9,
  194. 0x7c26, 0x6c07, 0x5c64, 0x4c45, 0x3ca2, 0x2c83, 0x1ce0, 0x0cc1,
  195. 0xef1f, 0xff3e, 0xcf5d, 0xdf7c, 0xaf9b, 0xbfba, 0x8fd9, 0x9ff8,
  196. 0x6e17, 0x7e36, 0x4e55, 0x5e74, 0x2e93, 0x3eb2, 0x0ed1, 0x1ef0
  197. );
  198. $len = strlen( $data );
  199. $crc = $seed;
  200. for( $i = 0; $i < $len; $i++ ) {
  201. $crc ^= ord( $data{$i} ) << 8;
  202. $crc &= 0xFFFF;
  203. $crc = ($crc << 8) ^ $MAGIC[$crc >> 8];
  204. $crc &= 0xFFFF;
  205. }
  206. return $crc;
  207. }
  208. /**
  209. * @param resource $destination
  210. * @param int $bytesToCopy
  211. * @return bool
  212. * @access private
  213. */
  214. function copyBytesTo( $destination, $bytesToCopy ) {
  215. $bufferSize = 65536;
  216. for( $remaining = $bytesToCopy; $remaining > 0; $remaining -= $bufferSize ) {
  217. $thisChunkSize = min( $remaining, $bufferSize );
  218. $buffer = fread( $this->handle, $thisChunkSize );
  219. fwrite( $destination, $buffer );
  220. }
  221. }
  222. /**
  223. * Hex dump of the header for debugging
  224. * @access private
  225. */
  226. function hexdump( $data ) {
  227. global $wgDebugLogFile;
  228. if( !$wgDebugLogFile ) return;
  229. $width = 16;
  230. $at = 0;
  231. for( $remaining = strlen( $data ); $remaining > 0; $remaining -= $width ) {
  232. $line = sprintf( "%04x:", $at );
  233. $printable = '';
  234. for( $i = 0; $i < $width && $remaining - $i > 0; $i++ ) {
  235. $byte = ord( $data{$at++} );
  236. $line .= sprintf( " %02x", $byte );
  237. $printable .= ($byte >= 32 && $byte <= 126 )
  238. ? chr( $byte )
  239. : '.';
  240. }
  241. if( $i < $width ) {
  242. $line .= str_repeat( ' ', $width - $i );
  243. }
  244. wfDebug( "MacBinary: $line $printable\n" );
  245. }
  246. }
  247. }