ImageFile.py 21 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697
  1. #
  2. # The Python Imaging Library.
  3. # $Id$
  4. #
  5. # base class for image file handlers
  6. #
  7. # history:
  8. # 1995-09-09 fl Created
  9. # 1996-03-11 fl Fixed load mechanism.
  10. # 1996-04-15 fl Added pcx/xbm decoders.
  11. # 1996-04-30 fl Added encoders.
  12. # 1996-12-14 fl Added load helpers
  13. # 1997-01-11 fl Use encode_to_file where possible
  14. # 1997-08-27 fl Flush output in _save
  15. # 1998-03-05 fl Use memory mapping for some modes
  16. # 1999-02-04 fl Use memory mapping also for "I;16" and "I;16B"
  17. # 1999-05-31 fl Added image parser
  18. # 2000-10-12 fl Set readonly flag on memory-mapped images
  19. # 2002-03-20 fl Use better messages for common decoder errors
  20. # 2003-04-21 fl Fall back on mmap/map_buffer if map is not available
  21. # 2003-10-30 fl Added StubImageFile class
  22. # 2004-02-25 fl Made incremental parser more robust
  23. #
  24. # Copyright (c) 1997-2004 by Secret Labs AB
  25. # Copyright (c) 1995-2004 by Fredrik Lundh
  26. #
  27. # See the README file for information on usage and redistribution.
  28. #
  29. import io
  30. import struct
  31. import sys
  32. import warnings
  33. from . import Image
  34. from ._util import isPath
  35. MAXBLOCK = 65536
  36. SAFEBLOCK = 1024 * 1024
  37. LOAD_TRUNCATED_IMAGES = False
  38. """Whether or not to load truncated image files. User code may change this."""
  39. ERRORS = {
  40. -1: "image buffer overrun error",
  41. -2: "decoding error",
  42. -3: "unknown error",
  43. -8: "bad configuration",
  44. -9: "out of memory error",
  45. }
  46. """Dict of known error codes returned from :meth:`.PyDecoder.decode`."""
  47. #
  48. # --------------------------------------------------------------------
  49. # Helpers
  50. def raise_oserror(error):
  51. try:
  52. message = Image.core.getcodecstatus(error)
  53. except AttributeError:
  54. message = ERRORS.get(error)
  55. if not message:
  56. message = f"decoder error {error}"
  57. raise OSError(message + " when reading image file")
  58. def raise_ioerror(error):
  59. warnings.warn(
  60. "raise_ioerror is deprecated and will be removed in a future release. "
  61. "Use raise_oserror instead.",
  62. DeprecationWarning,
  63. )
  64. return raise_oserror(error)
  65. def _tilesort(t):
  66. # sort on offset
  67. return t[2]
  68. #
  69. # --------------------------------------------------------------------
  70. # ImageFile base class
  71. class ImageFile(Image.Image):
  72. """Base class for image file format handlers."""
  73. def __init__(self, fp=None, filename=None):
  74. super().__init__()
  75. self._min_frame = 0
  76. self.custom_mimetype = None
  77. self.tile = None
  78. """ A list of tile descriptors, or ``None`` """
  79. self.readonly = 1 # until we know better
  80. self.decoderconfig = ()
  81. self.decodermaxblock = MAXBLOCK
  82. if isPath(fp):
  83. # filename
  84. self.fp = open(fp, "rb")
  85. self.filename = fp
  86. self._exclusive_fp = True
  87. else:
  88. # stream
  89. self.fp = fp
  90. self.filename = filename
  91. # can be overridden
  92. self._exclusive_fp = None
  93. try:
  94. try:
  95. self._open()
  96. except (
  97. IndexError, # end of data
  98. TypeError, # end of data (ord)
  99. KeyError, # unsupported mode
  100. EOFError, # got header but not the first frame
  101. struct.error,
  102. ) as v:
  103. raise SyntaxError(v) from v
  104. if not self.mode or self.size[0] <= 0:
  105. raise SyntaxError("not identified by this driver")
  106. except BaseException:
  107. # close the file only if we have opened it this constructor
  108. if self._exclusive_fp:
  109. self.fp.close()
  110. raise
  111. def get_format_mimetype(self):
  112. if self.custom_mimetype:
  113. return self.custom_mimetype
  114. if self.format is not None:
  115. return Image.MIME.get(self.format.upper())
  116. def verify(self):
  117. """Check file integrity"""
  118. # raise exception if something's wrong. must be called
  119. # directly after open, and closes file when finished.
  120. if self._exclusive_fp:
  121. self.fp.close()
  122. self.fp = None
  123. def load(self):
  124. """Load image data based on tile list"""
  125. if self.tile is None:
  126. raise OSError("cannot load this image")
  127. pixel = Image.Image.load(self)
  128. if not self.tile:
  129. return pixel
  130. self.map = None
  131. use_mmap = self.filename and len(self.tile) == 1
  132. # As of pypy 2.1.0, memory mapping was failing here.
  133. use_mmap = use_mmap and not hasattr(sys, "pypy_version_info")
  134. readonly = 0
  135. # look for read/seek overrides
  136. try:
  137. read = self.load_read
  138. # don't use mmap if there are custom read/seek functions
  139. use_mmap = False
  140. except AttributeError:
  141. read = self.fp.read
  142. try:
  143. seek = self.load_seek
  144. use_mmap = False
  145. except AttributeError:
  146. seek = self.fp.seek
  147. if use_mmap:
  148. # try memory mapping
  149. decoder_name, extents, offset, args = self.tile[0]
  150. if (
  151. decoder_name == "raw"
  152. and len(args) >= 3
  153. and args[0] == self.mode
  154. and args[0] in Image._MAPMODES
  155. ):
  156. try:
  157. if hasattr(Image.core, "map"):
  158. # use built-in mapper WIN32 only
  159. self.map = Image.core.map(self.filename)
  160. self.map.seek(offset)
  161. self.im = self.map.readimage(
  162. self.mode, self.size, args[1], args[2]
  163. )
  164. else:
  165. # use mmap, if possible
  166. import mmap
  167. with open(self.filename) as fp:
  168. self.map = mmap.mmap(
  169. fp.fileno(), 0, access=mmap.ACCESS_READ
  170. )
  171. self.im = Image.core.map_buffer(
  172. self.map, self.size, decoder_name, offset, args
  173. )
  174. readonly = 1
  175. # After trashing self.im,
  176. # we might need to reload the palette data.
  177. if self.palette:
  178. self.palette.dirty = 1
  179. except (AttributeError, OSError, ImportError):
  180. self.map = None
  181. self.load_prepare()
  182. err_code = -3 # initialize to unknown error
  183. if not self.map:
  184. # sort tiles in file order
  185. self.tile.sort(key=_tilesort)
  186. try:
  187. # FIXME: This is a hack to handle TIFF's JpegTables tag.
  188. prefix = self.tile_prefix
  189. except AttributeError:
  190. prefix = b""
  191. for decoder_name, extents, offset, args in self.tile:
  192. decoder = Image._getdecoder(
  193. self.mode, decoder_name, args, self.decoderconfig
  194. )
  195. try:
  196. seek(offset)
  197. decoder.setimage(self.im, extents)
  198. if decoder.pulls_fd:
  199. decoder.setfd(self.fp)
  200. status, err_code = decoder.decode(b"")
  201. else:
  202. b = prefix
  203. while True:
  204. try:
  205. s = read(self.decodermaxblock)
  206. except (IndexError, struct.error) as e:
  207. # truncated png/gif
  208. if LOAD_TRUNCATED_IMAGES:
  209. break
  210. else:
  211. raise OSError("image file is truncated") from e
  212. if not s: # truncated jpeg
  213. if LOAD_TRUNCATED_IMAGES:
  214. break
  215. else:
  216. raise OSError(
  217. "image file is truncated "
  218. f"({len(b)} bytes not processed)"
  219. )
  220. b = b + s
  221. n, err_code = decoder.decode(b)
  222. if n < 0:
  223. break
  224. b = b[n:]
  225. finally:
  226. # Need to cleanup here to prevent leaks
  227. decoder.cleanup()
  228. self.tile = []
  229. self.readonly = readonly
  230. self.load_end()
  231. if self._exclusive_fp and self._close_exclusive_fp_after_loading:
  232. self.fp.close()
  233. self.fp = None
  234. if not self.map and not LOAD_TRUNCATED_IMAGES and err_code < 0:
  235. # still raised if decoder fails to return anything
  236. raise_oserror(err_code)
  237. return Image.Image.load(self)
  238. def load_prepare(self):
  239. # create image memory if necessary
  240. if not self.im or self.im.mode != self.mode or self.im.size != self.size:
  241. self.im = Image.core.new(self.mode, self.size)
  242. # create palette (optional)
  243. if self.mode == "P":
  244. Image.Image.load(self)
  245. def load_end(self):
  246. # may be overridden
  247. pass
  248. # may be defined for contained formats
  249. # def load_seek(self, pos):
  250. # pass
  251. # may be defined for blocked formats (e.g. PNG)
  252. # def load_read(self, bytes):
  253. # pass
  254. def _seek_check(self, frame):
  255. if (
  256. frame < self._min_frame
  257. # Only check upper limit on frames if additional seek operations
  258. # are not required to do so
  259. or (
  260. not (hasattr(self, "_n_frames") and self._n_frames is None)
  261. and frame >= self.n_frames + self._min_frame
  262. )
  263. ):
  264. raise EOFError("attempt to seek outside sequence")
  265. return self.tell() != frame
  266. class StubImageFile(ImageFile):
  267. """
  268. Base class for stub image loaders.
  269. A stub loader is an image loader that can identify files of a
  270. certain format, but relies on external code to load the file.
  271. """
  272. def _open(self):
  273. raise NotImplementedError("StubImageFile subclass must implement _open")
  274. def load(self):
  275. loader = self._load()
  276. if loader is None:
  277. raise OSError(f"cannot find loader for this {self.format} file")
  278. image = loader.load(self)
  279. assert image is not None
  280. # become the other object (!)
  281. self.__class__ = image.__class__
  282. self.__dict__ = image.__dict__
  283. def _load(self):
  284. """(Hook) Find actual image loader."""
  285. raise NotImplementedError("StubImageFile subclass must implement _load")
  286. class Parser:
  287. """
  288. Incremental image parser. This class implements the standard
  289. feed/close consumer interface.
  290. """
  291. incremental = None
  292. image = None
  293. data = None
  294. decoder = None
  295. offset = 0
  296. finished = 0
  297. def reset(self):
  298. """
  299. (Consumer) Reset the parser. Note that you can only call this
  300. method immediately after you've created a parser; parser
  301. instances cannot be reused.
  302. """
  303. assert self.data is None, "cannot reuse parsers"
  304. def feed(self, data):
  305. """
  306. (Consumer) Feed data to the parser.
  307. :param data: A string buffer.
  308. :exception OSError: If the parser failed to parse the image file.
  309. """
  310. # collect data
  311. if self.finished:
  312. return
  313. if self.data is None:
  314. self.data = data
  315. else:
  316. self.data = self.data + data
  317. # parse what we have
  318. if self.decoder:
  319. if self.offset > 0:
  320. # skip header
  321. skip = min(len(self.data), self.offset)
  322. self.data = self.data[skip:]
  323. self.offset = self.offset - skip
  324. if self.offset > 0 or not self.data:
  325. return
  326. n, e = self.decoder.decode(self.data)
  327. if n < 0:
  328. # end of stream
  329. self.data = None
  330. self.finished = 1
  331. if e < 0:
  332. # decoding error
  333. self.image = None
  334. raise_oserror(e)
  335. else:
  336. # end of image
  337. return
  338. self.data = self.data[n:]
  339. elif self.image:
  340. # if we end up here with no decoder, this file cannot
  341. # be incrementally parsed. wait until we've gotten all
  342. # available data
  343. pass
  344. else:
  345. # attempt to open this file
  346. try:
  347. with io.BytesIO(self.data) as fp:
  348. im = Image.open(fp)
  349. except OSError:
  350. # traceback.print_exc()
  351. pass # not enough data
  352. else:
  353. flag = hasattr(im, "load_seek") or hasattr(im, "load_read")
  354. if flag or len(im.tile) != 1:
  355. # custom load code, or multiple tiles
  356. self.decode = None
  357. else:
  358. # initialize decoder
  359. im.load_prepare()
  360. d, e, o, a = im.tile[0]
  361. im.tile = []
  362. self.decoder = Image._getdecoder(im.mode, d, a, im.decoderconfig)
  363. self.decoder.setimage(im.im, e)
  364. # calculate decoder offset
  365. self.offset = o
  366. if self.offset <= len(self.data):
  367. self.data = self.data[self.offset :]
  368. self.offset = 0
  369. self.image = im
  370. def __enter__(self):
  371. return self
  372. def __exit__(self, *args):
  373. self.close()
  374. def close(self):
  375. """
  376. (Consumer) Close the stream.
  377. :returns: An image object.
  378. :exception OSError: If the parser failed to parse the image file either
  379. because it cannot be identified or cannot be
  380. decoded.
  381. """
  382. # finish decoding
  383. if self.decoder:
  384. # get rid of what's left in the buffers
  385. self.feed(b"")
  386. self.data = self.decoder = None
  387. if not self.finished:
  388. raise OSError("image was incomplete")
  389. if not self.image:
  390. raise OSError("cannot parse this image")
  391. if self.data:
  392. # incremental parsing not possible; reopen the file
  393. # not that we have all data
  394. with io.BytesIO(self.data) as fp:
  395. try:
  396. self.image = Image.open(fp)
  397. finally:
  398. self.image.load()
  399. return self.image
  400. # --------------------------------------------------------------------
  401. def _save(im, fp, tile, bufsize=0):
  402. """Helper to save image based on tile list
  403. :param im: Image object.
  404. :param fp: File object.
  405. :param tile: Tile list.
  406. :param bufsize: Optional buffer size
  407. """
  408. im.load()
  409. if not hasattr(im, "encoderconfig"):
  410. im.encoderconfig = ()
  411. tile.sort(key=_tilesort)
  412. # FIXME: make MAXBLOCK a configuration parameter
  413. # It would be great if we could have the encoder specify what it needs
  414. # But, it would need at least the image size in most cases. RawEncode is
  415. # a tricky case.
  416. bufsize = max(MAXBLOCK, bufsize, im.size[0] * 4) # see RawEncode.c
  417. if fp == sys.stdout:
  418. fp.flush()
  419. return
  420. try:
  421. fh = fp.fileno()
  422. fp.flush()
  423. except (AttributeError, io.UnsupportedOperation) as exc:
  424. # compress to Python file-compatible object
  425. for e, b, o, a in tile:
  426. e = Image._getencoder(im.mode, e, a, im.encoderconfig)
  427. if o > 0:
  428. fp.seek(o)
  429. e.setimage(im.im, b)
  430. if e.pushes_fd:
  431. e.setfd(fp)
  432. l, s = e.encode_to_pyfd()
  433. else:
  434. while True:
  435. l, s, d = e.encode(bufsize)
  436. fp.write(d)
  437. if s:
  438. break
  439. if s < 0:
  440. raise OSError(f"encoder error {s} when writing image file") from exc
  441. e.cleanup()
  442. else:
  443. # slight speedup: compress to real file object
  444. for e, b, o, a in tile:
  445. e = Image._getencoder(im.mode, e, a, im.encoderconfig)
  446. if o > 0:
  447. fp.seek(o)
  448. e.setimage(im.im, b)
  449. if e.pushes_fd:
  450. e.setfd(fp)
  451. l, s = e.encode_to_pyfd()
  452. else:
  453. s = e.encode_to_file(fh, bufsize)
  454. if s < 0:
  455. raise OSError(f"encoder error {s} when writing image file")
  456. e.cleanup()
  457. if hasattr(fp, "flush"):
  458. fp.flush()
  459. def _safe_read(fp, size):
  460. """
  461. Reads large blocks in a safe way. Unlike fp.read(n), this function
  462. doesn't trust the user. If the requested size is larger than
  463. SAFEBLOCK, the file is read block by block.
  464. :param fp: File handle. Must implement a <b>read</b> method.
  465. :param size: Number of bytes to read.
  466. :returns: A string containing up to <i>size</i> bytes of data.
  467. """
  468. if size <= 0:
  469. return b""
  470. if size <= SAFEBLOCK:
  471. return fp.read(size)
  472. data = []
  473. while size > 0:
  474. block = fp.read(min(size, SAFEBLOCK))
  475. if not block:
  476. break
  477. data.append(block)
  478. size -= len(block)
  479. return b"".join(data)
  480. class PyCodecState:
  481. def __init__(self):
  482. self.xsize = 0
  483. self.ysize = 0
  484. self.xoff = 0
  485. self.yoff = 0
  486. def extents(self):
  487. return (self.xoff, self.yoff, self.xoff + self.xsize, self.yoff + self.ysize)
  488. class PyDecoder:
  489. """
  490. Python implementation of a format decoder. Override this class and
  491. add the decoding logic in the :meth:`decode` method.
  492. See :ref:`Writing Your Own File Decoder in Python<file-decoders-py>`
  493. """
  494. _pulls_fd = False
  495. def __init__(self, mode, *args):
  496. self.im = None
  497. self.state = PyCodecState()
  498. self.fd = None
  499. self.mode = mode
  500. self.init(args)
  501. def init(self, args):
  502. """
  503. Override to perform decoder specific initialization
  504. :param args: Array of args items from the tile entry
  505. :returns: None
  506. """
  507. self.args = args
  508. @property
  509. def pulls_fd(self):
  510. return self._pulls_fd
  511. def decode(self, buffer):
  512. """
  513. Override to perform the decoding process.
  514. :param buffer: A bytes object with the data to be decoded.
  515. :returns: A tuple of ``(bytes consumed, errcode)``.
  516. If finished with decoding return <0 for the bytes consumed.
  517. Err codes are from :data:`.ImageFile.ERRORS`.
  518. """
  519. raise NotImplementedError()
  520. def cleanup(self):
  521. """
  522. Override to perform decoder specific cleanup
  523. :returns: None
  524. """
  525. pass
  526. def setfd(self, fd):
  527. """
  528. Called from ImageFile to set the python file-like object
  529. :param fd: A python file-like object
  530. :returns: None
  531. """
  532. self.fd = fd
  533. def setimage(self, im, extents=None):
  534. """
  535. Called from ImageFile to set the core output image for the decoder
  536. :param im: A core image object
  537. :param extents: a 4 tuple of (x0, y0, x1, y1) defining the rectangle
  538. for this tile
  539. :returns: None
  540. """
  541. # following c code
  542. self.im = im
  543. if extents:
  544. (x0, y0, x1, y1) = extents
  545. else:
  546. (x0, y0, x1, y1) = (0, 0, 0, 0)
  547. if x0 == 0 and x1 == 0:
  548. self.state.xsize, self.state.ysize = self.im.size
  549. else:
  550. self.state.xoff = x0
  551. self.state.yoff = y0
  552. self.state.xsize = x1 - x0
  553. self.state.ysize = y1 - y0
  554. if self.state.xsize <= 0 or self.state.ysize <= 0:
  555. raise ValueError("Size cannot be negative")
  556. if (
  557. self.state.xsize + self.state.xoff > self.im.size[0]
  558. or self.state.ysize + self.state.yoff > self.im.size[1]
  559. ):
  560. raise ValueError("Tile cannot extend outside image")
  561. def set_as_raw(self, data, rawmode=None):
  562. """
  563. Convenience method to set the internal image from a stream of raw data
  564. :param data: Bytes to be set
  565. :param rawmode: The rawmode to be used for the decoder.
  566. If not specified, it will default to the mode of the image
  567. :returns: None
  568. """
  569. if not rawmode:
  570. rawmode = self.mode
  571. d = Image._getdecoder(self.mode, "raw", (rawmode))
  572. d.setimage(self.im, self.state.extents())
  573. s = d.decode(data)
  574. if s[0] >= 0:
  575. raise ValueError("not enough image data")
  576. if s[1] != 0:
  577. raise ValueError("cannot decode image data")