Jpeg2KImagePlugin.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408
  1. #
  2. # The Python Imaging Library
  3. # $Id$
  4. #
  5. # JPEG2000 file handling
  6. #
  7. # History:
  8. # 2014-03-12 ajh Created
  9. # 2021-06-30 rogermb Extract dpi information from the 'resc' header box
  10. #
  11. # Copyright (c) 2014 Coriolis Systems Limited
  12. # Copyright (c) 2014 Alastair Houghton
  13. #
  14. # See the README file for information on usage and redistribution.
  15. #
  16. from __future__ import annotations
  17. import io
  18. import os
  19. import struct
  20. from typing import IO, Tuple, cast
  21. from . import Image, ImageFile, ImagePalette, _binary
  22. class BoxReader:
  23. """
  24. A small helper class to read fields stored in JPEG2000 header boxes
  25. and to easily step into and read sub-boxes.
  26. """
  27. def __init__(self, fp, length=-1):
  28. self.fp = fp
  29. self.has_length = length >= 0
  30. self.length = length
  31. self.remaining_in_box = -1
  32. def _can_read(self, num_bytes: int) -> bool:
  33. if self.has_length and self.fp.tell() + num_bytes > self.length:
  34. # Outside box: ensure we don't read past the known file length
  35. return False
  36. if self.remaining_in_box >= 0:
  37. # Inside box contents: ensure read does not go past box boundaries
  38. return num_bytes <= self.remaining_in_box
  39. else:
  40. return True # No length known, just read
  41. def _read_bytes(self, num_bytes: int) -> bytes:
  42. if not self._can_read(num_bytes):
  43. msg = "Not enough data in header"
  44. raise SyntaxError(msg)
  45. data = self.fp.read(num_bytes)
  46. if len(data) < num_bytes:
  47. msg = f"Expected to read {num_bytes} bytes but only got {len(data)}."
  48. raise OSError(msg)
  49. if self.remaining_in_box > 0:
  50. self.remaining_in_box -= num_bytes
  51. return data
  52. def read_fields(self, field_format: str) -> tuple[int | bytes, ...]:
  53. size = struct.calcsize(field_format)
  54. data = self._read_bytes(size)
  55. return struct.unpack(field_format, data)
  56. def read_boxes(self) -> BoxReader:
  57. size = self.remaining_in_box
  58. data = self._read_bytes(size)
  59. return BoxReader(io.BytesIO(data), size)
  60. def has_next_box(self) -> bool:
  61. if self.has_length:
  62. return self.fp.tell() + self.remaining_in_box < self.length
  63. else:
  64. return True
  65. def next_box_type(self) -> bytes:
  66. # Skip the rest of the box if it has not been read
  67. if self.remaining_in_box > 0:
  68. self.fp.seek(self.remaining_in_box, os.SEEK_CUR)
  69. self.remaining_in_box = -1
  70. # Read the length and type of the next box
  71. lbox, tbox = cast(Tuple[int, bytes], self.read_fields(">I4s"))
  72. if lbox == 1:
  73. lbox = cast(int, self.read_fields(">Q")[0])
  74. hlen = 16
  75. else:
  76. hlen = 8
  77. if lbox < hlen or not self._can_read(lbox - hlen):
  78. msg = "Invalid header length"
  79. raise SyntaxError(msg)
  80. self.remaining_in_box = lbox - hlen
  81. return tbox
  82. def _parse_codestream(fp) -> tuple[tuple[int, int], str]:
  83. """Parse the JPEG 2000 codestream to extract the size and component
  84. count from the SIZ marker segment, returning a PIL (size, mode) tuple."""
  85. hdr = fp.read(2)
  86. lsiz = _binary.i16be(hdr)
  87. siz = hdr + fp.read(lsiz - 2)
  88. lsiz, rsiz, xsiz, ysiz, xosiz, yosiz, _, _, _, _, csiz = struct.unpack_from(
  89. ">HHIIIIIIIIH", siz
  90. )
  91. size = (xsiz - xosiz, ysiz - yosiz)
  92. if csiz == 1:
  93. ssiz = struct.unpack_from(">B", siz, 38)
  94. if (ssiz[0] & 0x7F) + 1 > 8:
  95. mode = "I;16"
  96. else:
  97. mode = "L"
  98. elif csiz == 2:
  99. mode = "LA"
  100. elif csiz == 3:
  101. mode = "RGB"
  102. elif csiz == 4:
  103. mode = "RGBA"
  104. else:
  105. msg = "unable to determine J2K image mode"
  106. raise SyntaxError(msg)
  107. return size, mode
  108. def _res_to_dpi(num: int, denom: int, exp: int) -> float | None:
  109. """Convert JPEG2000's (numerator, denominator, exponent-base-10) resolution,
  110. calculated as (num / denom) * 10^exp and stored in dots per meter,
  111. to floating-point dots per inch."""
  112. if denom == 0:
  113. return None
  114. return (254 * num * (10**exp)) / (10000 * denom)
  115. def _parse_jp2_header(fp):
  116. """Parse the JP2 header box to extract size, component count,
  117. color space information, and optionally DPI information,
  118. returning a (size, mode, mimetype, dpi) tuple."""
  119. # Find the JP2 header box
  120. reader = BoxReader(fp)
  121. header = None
  122. mimetype = None
  123. while reader.has_next_box():
  124. tbox = reader.next_box_type()
  125. if tbox == b"jp2h":
  126. header = reader.read_boxes()
  127. break
  128. elif tbox == b"ftyp":
  129. if reader.read_fields(">4s")[0] == b"jpx ":
  130. mimetype = "image/jpx"
  131. size = None
  132. mode = None
  133. bpc = None
  134. nc = None
  135. dpi = None # 2-tuple of DPI info, or None
  136. palette = None
  137. while header.has_next_box():
  138. tbox = header.next_box_type()
  139. if tbox == b"ihdr":
  140. height, width, nc, bpc = header.read_fields(">IIHB")
  141. size = (width, height)
  142. if nc == 1 and (bpc & 0x7F) > 8:
  143. mode = "I;16"
  144. elif nc == 1:
  145. mode = "L"
  146. elif nc == 2:
  147. mode = "LA"
  148. elif nc == 3:
  149. mode = "RGB"
  150. elif nc == 4:
  151. mode = "RGBA"
  152. elif tbox == b"colr" and nc == 4:
  153. meth, _, _, enumcs = header.read_fields(">BBBI")
  154. if meth == 1 and enumcs == 12:
  155. mode = "CMYK"
  156. elif tbox == b"pclr" and mode in ("L", "LA"):
  157. ne, npc = header.read_fields(">HB")
  158. bitdepths = header.read_fields(">" + ("B" * npc))
  159. if max(bitdepths) <= 8:
  160. palette = ImagePalette.ImagePalette()
  161. for i in range(ne):
  162. palette.getcolor(header.read_fields(">" + ("B" * npc)))
  163. mode = "P" if mode == "L" else "PA"
  164. elif tbox == b"res ":
  165. res = header.read_boxes()
  166. while res.has_next_box():
  167. tres = res.next_box_type()
  168. if tres == b"resc":
  169. vrcn, vrcd, hrcn, hrcd, vrce, hrce = res.read_fields(">HHHHBB")
  170. hres = _res_to_dpi(hrcn, hrcd, hrce)
  171. vres = _res_to_dpi(vrcn, vrcd, vrce)
  172. if hres is not None and vres is not None:
  173. dpi = (hres, vres)
  174. break
  175. if size is None or mode is None:
  176. msg = "Malformed JP2 header"
  177. raise SyntaxError(msg)
  178. return size, mode, mimetype, dpi, palette
  179. ##
  180. # Image plugin for JPEG2000 images.
  181. class Jpeg2KImageFile(ImageFile.ImageFile):
  182. format = "JPEG2000"
  183. format_description = "JPEG 2000 (ISO 15444)"
  184. def _open(self) -> None:
  185. sig = self.fp.read(4)
  186. if sig == b"\xff\x4f\xff\x51":
  187. self.codec = "j2k"
  188. self._size, self._mode = _parse_codestream(self.fp)
  189. else:
  190. sig = sig + self.fp.read(8)
  191. if sig == b"\x00\x00\x00\x0cjP \x0d\x0a\x87\x0a":
  192. self.codec = "jp2"
  193. header = _parse_jp2_header(self.fp)
  194. self._size, self._mode, self.custom_mimetype, dpi, self.palette = header
  195. if dpi is not None:
  196. self.info["dpi"] = dpi
  197. if self.fp.read(12).endswith(b"jp2c\xff\x4f\xff\x51"):
  198. self._parse_comment()
  199. else:
  200. msg = "not a JPEG 2000 file"
  201. raise SyntaxError(msg)
  202. self._reduce = 0
  203. self.layers = 0
  204. fd = -1
  205. length = -1
  206. try:
  207. fd = self.fp.fileno()
  208. length = os.fstat(fd).st_size
  209. except Exception:
  210. fd = -1
  211. try:
  212. pos = self.fp.tell()
  213. self.fp.seek(0, io.SEEK_END)
  214. length = self.fp.tell()
  215. self.fp.seek(pos)
  216. except Exception:
  217. length = -1
  218. self.tile = [
  219. (
  220. "jpeg2k",
  221. (0, 0) + self.size,
  222. 0,
  223. (self.codec, self._reduce, self.layers, fd, length),
  224. )
  225. ]
  226. def _parse_comment(self) -> None:
  227. hdr = self.fp.read(2)
  228. length = _binary.i16be(hdr)
  229. self.fp.seek(length - 2, os.SEEK_CUR)
  230. while True:
  231. marker = self.fp.read(2)
  232. if not marker:
  233. break
  234. typ = marker[1]
  235. if typ in (0x90, 0xD9):
  236. # Start of tile or end of codestream
  237. break
  238. hdr = self.fp.read(2)
  239. length = _binary.i16be(hdr)
  240. if typ == 0x64:
  241. # Comment
  242. self.info["comment"] = self.fp.read(length - 2)[2:]
  243. break
  244. else:
  245. self.fp.seek(length - 2, os.SEEK_CUR)
  246. @property
  247. def reduce(self):
  248. # https://github.com/python-pillow/Pillow/issues/4343 found that the
  249. # new Image 'reduce' method was shadowed by this plugin's 'reduce'
  250. # property. This attempts to allow for both scenarios
  251. return self._reduce or super().reduce
  252. @reduce.setter
  253. def reduce(self, value):
  254. self._reduce = value
  255. def load(self):
  256. if self.tile and self._reduce:
  257. power = 1 << self._reduce
  258. adjust = power >> 1
  259. self._size = (
  260. int((self.size[0] + adjust) / power),
  261. int((self.size[1] + adjust) / power),
  262. )
  263. # Update the reduce and layers settings
  264. t = self.tile[0]
  265. t3 = (t[3][0], self._reduce, self.layers, t[3][3], t[3][4])
  266. self.tile = [(t[0], (0, 0) + self.size, t[2], t3)]
  267. return ImageFile.ImageFile.load(self)
  268. def _accept(prefix: bytes) -> bool:
  269. return (
  270. prefix[:4] == b"\xff\x4f\xff\x51"
  271. or prefix[:12] == b"\x00\x00\x00\x0cjP \x0d\x0a\x87\x0a"
  272. )
  273. # ------------------------------------------------------------
  274. # Save support
  275. def _save(im: Image.Image, fp: IO[bytes], filename: str | bytes) -> None:
  276. # Get the keyword arguments
  277. info = im.encoderinfo
  278. if isinstance(filename, str):
  279. filename = filename.encode()
  280. if filename.endswith(b".j2k") or info.get("no_jp2", False):
  281. kind = "j2k"
  282. else:
  283. kind = "jp2"
  284. offset = info.get("offset", None)
  285. tile_offset = info.get("tile_offset", None)
  286. tile_size = info.get("tile_size", None)
  287. quality_mode = info.get("quality_mode", "rates")
  288. quality_layers = info.get("quality_layers", None)
  289. if quality_layers is not None and not (
  290. isinstance(quality_layers, (list, tuple))
  291. and all(
  292. isinstance(quality_layer, (int, float)) for quality_layer in quality_layers
  293. )
  294. ):
  295. msg = "quality_layers must be a sequence of numbers"
  296. raise ValueError(msg)
  297. num_resolutions = info.get("num_resolutions", 0)
  298. cblk_size = info.get("codeblock_size", None)
  299. precinct_size = info.get("precinct_size", None)
  300. irreversible = info.get("irreversible", False)
  301. progression = info.get("progression", "LRCP")
  302. cinema_mode = info.get("cinema_mode", "no")
  303. mct = info.get("mct", 0)
  304. signed = info.get("signed", False)
  305. comment = info.get("comment")
  306. if isinstance(comment, str):
  307. comment = comment.encode()
  308. plt = info.get("plt", False)
  309. fd = -1
  310. if hasattr(fp, "fileno"):
  311. try:
  312. fd = fp.fileno()
  313. except Exception:
  314. fd = -1
  315. im.encoderconfig = (
  316. offset,
  317. tile_offset,
  318. tile_size,
  319. quality_mode,
  320. quality_layers,
  321. num_resolutions,
  322. cblk_size,
  323. precinct_size,
  324. irreversible,
  325. progression,
  326. cinema_mode,
  327. mct,
  328. signed,
  329. fd,
  330. comment,
  331. plt,
  332. )
  333. ImageFile._save(im, fp, [("jpeg2k", (0, 0) + im.size, 0, kind)])
  334. # ------------------------------------------------------------
  335. # Registry stuff
  336. Image.register_open(Jpeg2KImageFile.format, Jpeg2KImageFile, _accept)
  337. Image.register_save(Jpeg2KImageFile.format, _save)
  338. Image.register_extensions(
  339. Jpeg2KImageFile.format, [".jp2", ".j2k", ".jpc", ".jpf", ".jpx", ".j2c"]
  340. )
  341. Image.register_mime(Jpeg2KImageFile.format, "image/jp2")