JpegImagePlugin.py 31 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888
  1. #
  2. # The Python Imaging Library.
  3. # $Id$
  4. #
  5. # JPEG (JFIF) file handling
  6. #
  7. # See "Digital Compression and Coding of Continuous-Tone Still Images,
  8. # Part 1, Requirements and Guidelines" (CCITT T.81 / ISO 10918-1)
  9. #
  10. # History:
  11. # 1995-09-09 fl Created
  12. # 1995-09-13 fl Added full parser
  13. # 1996-03-25 fl Added hack to use the IJG command line utilities
  14. # 1996-05-05 fl Workaround Photoshop 2.5 CMYK polarity bug
  15. # 1996-05-28 fl Added draft support, JFIF version (0.1)
  16. # 1996-12-30 fl Added encoder options, added progression property (0.2)
  17. # 1997-08-27 fl Save mode 1 images as BW (0.3)
  18. # 1998-07-12 fl Added YCbCr to draft and save methods (0.4)
  19. # 1998-10-19 fl Don't hang on files using 16-bit DQT's (0.4.1)
  20. # 2001-04-16 fl Extract DPI settings from JFIF files (0.4.2)
  21. # 2002-07-01 fl Skip pad bytes before markers; identify Exif files (0.4.3)
  22. # 2003-04-25 fl Added experimental EXIF decoder (0.5)
  23. # 2003-06-06 fl Added experimental EXIF GPSinfo decoder
  24. # 2003-09-13 fl Extract COM markers
  25. # 2009-09-06 fl Added icc_profile support (from Florian Hoech)
  26. # 2009-03-06 fl Changed CMYK handling; always use Adobe polarity (0.6)
  27. # 2009-03-08 fl Added subsampling support (from Justin Huff).
  28. #
  29. # Copyright (c) 1997-2003 by Secret Labs AB.
  30. # Copyright (c) 1995-1996 by Fredrik Lundh.
  31. #
  32. # See the README file for information on usage and redistribution.
  33. #
  34. from __future__ import annotations
  35. import array
  36. import io
  37. import math
  38. import os
  39. import struct
  40. import subprocess
  41. import sys
  42. import tempfile
  43. import warnings
  44. from . import Image, ImageFile
  45. from ._binary import i16be as i16
  46. from ._binary import i32be as i32
  47. from ._binary import o8
  48. from ._binary import o16be as o16
  49. from .JpegPresets import presets
  50. TYPE_CHECKING = False
  51. if TYPE_CHECKING:
  52. from typing import IO, Any
  53. from .MpoImagePlugin import MpoImageFile
  54. #
  55. # Parser
  56. def Skip(self: JpegImageFile, marker: int) -> None:
  57. n = i16(self.fp.read(2)) - 2
  58. ImageFile._safe_read(self.fp, n)
  59. def APP(self: JpegImageFile, marker: int) -> None:
  60. #
  61. # Application marker. Store these in the APP dictionary.
  62. # Also look for well-known application markers.
  63. n = i16(self.fp.read(2)) - 2
  64. s = ImageFile._safe_read(self.fp, n)
  65. app = f"APP{marker & 15}"
  66. self.app[app] = s # compatibility
  67. self.applist.append((app, s))
  68. if marker == 0xFFE0 and s.startswith(b"JFIF"):
  69. # extract JFIF information
  70. self.info["jfif"] = version = i16(s, 5) # version
  71. self.info["jfif_version"] = divmod(version, 256)
  72. # extract JFIF properties
  73. try:
  74. jfif_unit = s[7]
  75. jfif_density = i16(s, 8), i16(s, 10)
  76. except Exception:
  77. pass
  78. else:
  79. if jfif_unit == 1:
  80. self.info["dpi"] = jfif_density
  81. elif jfif_unit == 2: # cm
  82. # 1 dpcm = 2.54 dpi
  83. self.info["dpi"] = tuple(d * 2.54 for d in jfif_density)
  84. self.info["jfif_unit"] = jfif_unit
  85. self.info["jfif_density"] = jfif_density
  86. elif marker == 0xFFE1 and s.startswith(b"Exif\0\0"):
  87. # extract EXIF information
  88. if "exif" in self.info:
  89. self.info["exif"] += s[6:]
  90. else:
  91. self.info["exif"] = s
  92. self._exif_offset = self.fp.tell() - n + 6
  93. elif marker == 0xFFE1 and s.startswith(b"http://ns.adobe.com/xap/1.0/\x00"):
  94. self.info["xmp"] = s.split(b"\x00", 1)[1]
  95. elif marker == 0xFFE2 and s.startswith(b"FPXR\0"):
  96. # extract FlashPix information (incomplete)
  97. self.info["flashpix"] = s # FIXME: value will change
  98. elif marker == 0xFFE2 and s.startswith(b"ICC_PROFILE\0"):
  99. # Since an ICC profile can be larger than the maximum size of
  100. # a JPEG marker (64K), we need provisions to split it into
  101. # multiple markers. The format defined by the ICC specifies
  102. # one or more APP2 markers containing the following data:
  103. # Identifying string ASCII "ICC_PROFILE\0" (12 bytes)
  104. # Marker sequence number 1, 2, etc (1 byte)
  105. # Number of markers Total of APP2's used (1 byte)
  106. # Profile data (remainder of APP2 data)
  107. # Decoders should use the marker sequence numbers to
  108. # reassemble the profile, rather than assuming that the APP2
  109. # markers appear in the correct sequence.
  110. self.icclist.append(s)
  111. elif marker == 0xFFED and s.startswith(b"Photoshop 3.0\x00"):
  112. # parse the image resource block
  113. offset = 14
  114. photoshop = self.info.setdefault("photoshop", {})
  115. while s[offset : offset + 4] == b"8BIM":
  116. try:
  117. offset += 4
  118. # resource code
  119. code = i16(s, offset)
  120. offset += 2
  121. # resource name (usually empty)
  122. name_len = s[offset]
  123. # name = s[offset+1:offset+1+name_len]
  124. offset += 1 + name_len
  125. offset += offset & 1 # align
  126. # resource data block
  127. size = i32(s, offset)
  128. offset += 4
  129. data = s[offset : offset + size]
  130. if code == 0x03ED: # ResolutionInfo
  131. photoshop[code] = {
  132. "XResolution": i32(data, 0) / 65536,
  133. "DisplayedUnitsX": i16(data, 4),
  134. "YResolution": i32(data, 8) / 65536,
  135. "DisplayedUnitsY": i16(data, 12),
  136. }
  137. else:
  138. photoshop[code] = data
  139. offset += size
  140. offset += offset & 1 # align
  141. except struct.error:
  142. break # insufficient data
  143. elif marker == 0xFFEE and s.startswith(b"Adobe"):
  144. self.info["adobe"] = i16(s, 5)
  145. # extract Adobe custom properties
  146. try:
  147. adobe_transform = s[11]
  148. except IndexError:
  149. pass
  150. else:
  151. self.info["adobe_transform"] = adobe_transform
  152. elif marker == 0xFFE2 and s.startswith(b"MPF\0"):
  153. # extract MPO information
  154. self.info["mp"] = s[4:]
  155. # offset is current location minus buffer size
  156. # plus constant header size
  157. self.info["mpoffset"] = self.fp.tell() - n + 4
  158. def COM(self: JpegImageFile, marker: int) -> None:
  159. #
  160. # Comment marker. Store these in the APP dictionary.
  161. n = i16(self.fp.read(2)) - 2
  162. s = ImageFile._safe_read(self.fp, n)
  163. self.info["comment"] = s
  164. self.app["COM"] = s # compatibility
  165. self.applist.append(("COM", s))
  166. def SOF(self: JpegImageFile, marker: int) -> None:
  167. #
  168. # Start of frame marker. Defines the size and mode of the
  169. # image. JPEG is colour blind, so we use some simple
  170. # heuristics to map the number of layers to an appropriate
  171. # mode. Note that this could be made a bit brighter, by
  172. # looking for JFIF and Adobe APP markers.
  173. n = i16(self.fp.read(2)) - 2
  174. s = ImageFile._safe_read(self.fp, n)
  175. self._size = i16(s, 3), i16(s, 1)
  176. if self._im is not None and self.size != self.im.size:
  177. self._im = None
  178. self.bits = s[0]
  179. if self.bits != 8:
  180. msg = f"cannot handle {self.bits}-bit layers"
  181. raise SyntaxError(msg)
  182. self.layers = s[5]
  183. if self.layers == 1:
  184. self._mode = "L"
  185. elif self.layers == 3:
  186. self._mode = "RGB"
  187. elif self.layers == 4:
  188. self._mode = "CMYK"
  189. else:
  190. msg = f"cannot handle {self.layers}-layer images"
  191. raise SyntaxError(msg)
  192. if marker in [0xFFC2, 0xFFC6, 0xFFCA, 0xFFCE]:
  193. self.info["progressive"] = self.info["progression"] = 1
  194. if self.icclist:
  195. # fixup icc profile
  196. self.icclist.sort() # sort by sequence number
  197. if self.icclist[0][13] == len(self.icclist):
  198. profile = [p[14:] for p in self.icclist]
  199. icc_profile = b"".join(profile)
  200. else:
  201. icc_profile = None # wrong number of fragments
  202. self.info["icc_profile"] = icc_profile
  203. self.icclist = []
  204. for i in range(6, len(s), 3):
  205. t = s[i : i + 3]
  206. # 4-tuples: id, vsamp, hsamp, qtable
  207. self.layer.append((t[0], t[1] // 16, t[1] & 15, t[2]))
  208. def DQT(self: JpegImageFile, marker: int) -> None:
  209. #
  210. # Define quantization table. Note that there might be more
  211. # than one table in each marker.
  212. # FIXME: The quantization tables can be used to estimate the
  213. # compression quality.
  214. n = i16(self.fp.read(2)) - 2
  215. s = ImageFile._safe_read(self.fp, n)
  216. while len(s):
  217. v = s[0]
  218. precision = 1 if (v // 16 == 0) else 2 # in bytes
  219. qt_length = 1 + precision * 64
  220. if len(s) < qt_length:
  221. msg = "bad quantization table marker"
  222. raise SyntaxError(msg)
  223. data = array.array("B" if precision == 1 else "H", s[1:qt_length])
  224. if sys.byteorder == "little" and precision > 1:
  225. data.byteswap() # the values are always big-endian
  226. self.quantization[v & 15] = [data[i] for i in zigzag_index]
  227. s = s[qt_length:]
  228. #
  229. # JPEG marker table
  230. MARKER = {
  231. 0xFFC0: ("SOF0", "Baseline DCT", SOF),
  232. 0xFFC1: ("SOF1", "Extended Sequential DCT", SOF),
  233. 0xFFC2: ("SOF2", "Progressive DCT", SOF),
  234. 0xFFC3: ("SOF3", "Spatial lossless", SOF),
  235. 0xFFC4: ("DHT", "Define Huffman table", Skip),
  236. 0xFFC5: ("SOF5", "Differential sequential DCT", SOF),
  237. 0xFFC6: ("SOF6", "Differential progressive DCT", SOF),
  238. 0xFFC7: ("SOF7", "Differential spatial", SOF),
  239. 0xFFC8: ("JPG", "Extension", None),
  240. 0xFFC9: ("SOF9", "Extended sequential DCT (AC)", SOF),
  241. 0xFFCA: ("SOF10", "Progressive DCT (AC)", SOF),
  242. 0xFFCB: ("SOF11", "Spatial lossless DCT (AC)", SOF),
  243. 0xFFCC: ("DAC", "Define arithmetic coding conditioning", Skip),
  244. 0xFFCD: ("SOF13", "Differential sequential DCT (AC)", SOF),
  245. 0xFFCE: ("SOF14", "Differential progressive DCT (AC)", SOF),
  246. 0xFFCF: ("SOF15", "Differential spatial (AC)", SOF),
  247. 0xFFD0: ("RST0", "Restart 0", None),
  248. 0xFFD1: ("RST1", "Restart 1", None),
  249. 0xFFD2: ("RST2", "Restart 2", None),
  250. 0xFFD3: ("RST3", "Restart 3", None),
  251. 0xFFD4: ("RST4", "Restart 4", None),
  252. 0xFFD5: ("RST5", "Restart 5", None),
  253. 0xFFD6: ("RST6", "Restart 6", None),
  254. 0xFFD7: ("RST7", "Restart 7", None),
  255. 0xFFD8: ("SOI", "Start of image", None),
  256. 0xFFD9: ("EOI", "End of image", None),
  257. 0xFFDA: ("SOS", "Start of scan", Skip),
  258. 0xFFDB: ("DQT", "Define quantization table", DQT),
  259. 0xFFDC: ("DNL", "Define number of lines", Skip),
  260. 0xFFDD: ("DRI", "Define restart interval", Skip),
  261. 0xFFDE: ("DHP", "Define hierarchical progression", SOF),
  262. 0xFFDF: ("EXP", "Expand reference component", Skip),
  263. 0xFFE0: ("APP0", "Application segment 0", APP),
  264. 0xFFE1: ("APP1", "Application segment 1", APP),
  265. 0xFFE2: ("APP2", "Application segment 2", APP),
  266. 0xFFE3: ("APP3", "Application segment 3", APP),
  267. 0xFFE4: ("APP4", "Application segment 4", APP),
  268. 0xFFE5: ("APP5", "Application segment 5", APP),
  269. 0xFFE6: ("APP6", "Application segment 6", APP),
  270. 0xFFE7: ("APP7", "Application segment 7", APP),
  271. 0xFFE8: ("APP8", "Application segment 8", APP),
  272. 0xFFE9: ("APP9", "Application segment 9", APP),
  273. 0xFFEA: ("APP10", "Application segment 10", APP),
  274. 0xFFEB: ("APP11", "Application segment 11", APP),
  275. 0xFFEC: ("APP12", "Application segment 12", APP),
  276. 0xFFED: ("APP13", "Application segment 13", APP),
  277. 0xFFEE: ("APP14", "Application segment 14", APP),
  278. 0xFFEF: ("APP15", "Application segment 15", APP),
  279. 0xFFF0: ("JPG0", "Extension 0", None),
  280. 0xFFF1: ("JPG1", "Extension 1", None),
  281. 0xFFF2: ("JPG2", "Extension 2", None),
  282. 0xFFF3: ("JPG3", "Extension 3", None),
  283. 0xFFF4: ("JPG4", "Extension 4", None),
  284. 0xFFF5: ("JPG5", "Extension 5", None),
  285. 0xFFF6: ("JPG6", "Extension 6", None),
  286. 0xFFF7: ("JPG7", "Extension 7", None),
  287. 0xFFF8: ("JPG8", "Extension 8", None),
  288. 0xFFF9: ("JPG9", "Extension 9", None),
  289. 0xFFFA: ("JPG10", "Extension 10", None),
  290. 0xFFFB: ("JPG11", "Extension 11", None),
  291. 0xFFFC: ("JPG12", "Extension 12", None),
  292. 0xFFFD: ("JPG13", "Extension 13", None),
  293. 0xFFFE: ("COM", "Comment", COM),
  294. }
  295. def _accept(prefix: bytes) -> bool:
  296. # Magic number was taken from https://en.wikipedia.org/wiki/JPEG
  297. return prefix.startswith(b"\xff\xd8\xff")
  298. ##
  299. # Image plugin for JPEG and JFIF images.
  300. class JpegImageFile(ImageFile.ImageFile):
  301. format = "JPEG"
  302. format_description = "JPEG (ISO 10918)"
  303. def _open(self) -> None:
  304. s = self.fp.read(3)
  305. if not _accept(s):
  306. msg = "not a JPEG file"
  307. raise SyntaxError(msg)
  308. s = b"\xff"
  309. # Create attributes
  310. self.bits = self.layers = 0
  311. self._exif_offset = 0
  312. # JPEG specifics (internal)
  313. self.layer: list[tuple[int, int, int, int]] = []
  314. self._huffman_dc: dict[Any, Any] = {}
  315. self._huffman_ac: dict[Any, Any] = {}
  316. self.quantization: dict[int, list[int]] = {}
  317. self.app: dict[str, bytes] = {} # compatibility
  318. self.applist: list[tuple[str, bytes]] = []
  319. self.icclist: list[bytes] = []
  320. while True:
  321. i = s[0]
  322. if i == 0xFF:
  323. s = s + self.fp.read(1)
  324. i = i16(s)
  325. else:
  326. # Skip non-0xFF junk
  327. s = self.fp.read(1)
  328. continue
  329. if i in MARKER:
  330. name, description, handler = MARKER[i]
  331. if handler is not None:
  332. handler(self, i)
  333. if i == 0xFFDA: # start of scan
  334. rawmode = self.mode
  335. if self.mode == "CMYK":
  336. rawmode = "CMYK;I" # assume adobe conventions
  337. self.tile = [
  338. ImageFile._Tile("jpeg", (0, 0) + self.size, 0, (rawmode, ""))
  339. ]
  340. # self.__offset = self.fp.tell()
  341. break
  342. s = self.fp.read(1)
  343. elif i in {0, 0xFFFF}:
  344. # padded marker or junk; move on
  345. s = b"\xff"
  346. elif i == 0xFF00: # Skip extraneous data (escaped 0xFF)
  347. s = self.fp.read(1)
  348. else:
  349. msg = "no marker found"
  350. raise SyntaxError(msg)
  351. self._read_dpi_from_exif()
  352. def __getstate__(self) -> list[Any]:
  353. return super().__getstate__() + [self.layers, self.layer]
  354. def __setstate__(self, state: list[Any]) -> None:
  355. self.layers, self.layer = state[6:]
  356. super().__setstate__(state)
  357. def load_read(self, read_bytes: int) -> bytes:
  358. """
  359. internal: read more image data
  360. For premature EOF and LOAD_TRUNCATED_IMAGES adds EOI marker
  361. so libjpeg can finish decoding
  362. """
  363. s = self.fp.read(read_bytes)
  364. if not s and ImageFile.LOAD_TRUNCATED_IMAGES and not hasattr(self, "_ended"):
  365. # Premature EOF.
  366. # Pretend file is finished adding EOI marker
  367. self._ended = True
  368. return b"\xff\xd9"
  369. return s
  370. def draft(
  371. self, mode: str | None, size: tuple[int, int] | None
  372. ) -> tuple[str, tuple[int, int, float, float]] | None:
  373. if len(self.tile) != 1:
  374. return None
  375. # Protect from second call
  376. if self.decoderconfig:
  377. return None
  378. d, e, o, a = self.tile[0]
  379. scale = 1
  380. original_size = self.size
  381. assert isinstance(a, tuple)
  382. if a[0] == "RGB" and mode in ["L", "YCbCr"]:
  383. self._mode = mode
  384. a = mode, ""
  385. if size:
  386. scale = min(self.size[0] // size[0], self.size[1] // size[1])
  387. for s in [8, 4, 2, 1]:
  388. if scale >= s:
  389. break
  390. assert e is not None
  391. e = (
  392. e[0],
  393. e[1],
  394. (e[2] - e[0] + s - 1) // s + e[0],
  395. (e[3] - e[1] + s - 1) // s + e[1],
  396. )
  397. self._size = ((self.size[0] + s - 1) // s, (self.size[1] + s - 1) // s)
  398. scale = s
  399. self.tile = [ImageFile._Tile(d, e, o, a)]
  400. self.decoderconfig = (scale, 0)
  401. box = (0, 0, original_size[0] / scale, original_size[1] / scale)
  402. return self.mode, box
  403. def load_djpeg(self) -> None:
  404. # ALTERNATIVE: handle JPEGs via the IJG command line utilities
  405. f, path = tempfile.mkstemp()
  406. os.close(f)
  407. if os.path.exists(self.filename):
  408. subprocess.check_call(["djpeg", "-outfile", path, self.filename])
  409. else:
  410. try:
  411. os.unlink(path)
  412. except OSError:
  413. pass
  414. msg = "Invalid Filename"
  415. raise ValueError(msg)
  416. try:
  417. with Image.open(path) as _im:
  418. _im.load()
  419. self.im = _im.im
  420. finally:
  421. try:
  422. os.unlink(path)
  423. except OSError:
  424. pass
  425. self._mode = self.im.mode
  426. self._size = self.im.size
  427. self.tile = []
  428. def _getexif(self) -> dict[int, Any] | None:
  429. return _getexif(self)
  430. def _read_dpi_from_exif(self) -> None:
  431. # If DPI isn't in JPEG header, fetch from EXIF
  432. if "dpi" in self.info or "exif" not in self.info:
  433. return
  434. try:
  435. exif = self.getexif()
  436. resolution_unit = exif[0x0128]
  437. x_resolution = exif[0x011A]
  438. try:
  439. dpi = float(x_resolution[0]) / x_resolution[1]
  440. except TypeError:
  441. dpi = x_resolution
  442. if math.isnan(dpi):
  443. msg = "DPI is not a number"
  444. raise ValueError(msg)
  445. if resolution_unit == 3: # cm
  446. # 1 dpcm = 2.54 dpi
  447. dpi *= 2.54
  448. self.info["dpi"] = dpi, dpi
  449. except (
  450. struct.error, # truncated EXIF
  451. KeyError, # dpi not included
  452. SyntaxError, # invalid/unreadable EXIF
  453. TypeError, # dpi is an invalid float
  454. ValueError, # dpi is an invalid float
  455. ZeroDivisionError, # invalid dpi rational value
  456. ):
  457. self.info["dpi"] = 72, 72
  458. def _getmp(self) -> dict[int, Any] | None:
  459. return _getmp(self)
  460. def _getexif(self: JpegImageFile) -> dict[int, Any] | None:
  461. if "exif" not in self.info:
  462. return None
  463. return self.getexif()._get_merged_dict()
  464. def _getmp(self: JpegImageFile) -> dict[int, Any] | None:
  465. # Extract MP information. This method was inspired by the "highly
  466. # experimental" _getexif version that's been in use for years now,
  467. # itself based on the ImageFileDirectory class in the TIFF plugin.
  468. # The MP record essentially consists of a TIFF file embedded in a JPEG
  469. # application marker.
  470. try:
  471. data = self.info["mp"]
  472. except KeyError:
  473. return None
  474. file_contents = io.BytesIO(data)
  475. head = file_contents.read(8)
  476. endianness = ">" if head.startswith(b"\x4d\x4d\x00\x2a") else "<"
  477. # process dictionary
  478. from . import TiffImagePlugin
  479. try:
  480. info = TiffImagePlugin.ImageFileDirectory_v2(head)
  481. file_contents.seek(info.next)
  482. info.load(file_contents)
  483. mp = dict(info)
  484. except Exception as e:
  485. msg = "malformed MP Index (unreadable directory)"
  486. raise SyntaxError(msg) from e
  487. # it's an error not to have a number of images
  488. try:
  489. quant = mp[0xB001]
  490. except KeyError as e:
  491. msg = "malformed MP Index (no number of images)"
  492. raise SyntaxError(msg) from e
  493. # get MP entries
  494. mpentries = []
  495. try:
  496. rawmpentries = mp[0xB002]
  497. for entrynum in range(quant):
  498. unpackedentry = struct.unpack_from(
  499. f"{endianness}LLLHH", rawmpentries, entrynum * 16
  500. )
  501. labels = ("Attribute", "Size", "DataOffset", "EntryNo1", "EntryNo2")
  502. mpentry = dict(zip(labels, unpackedentry))
  503. mpentryattr = {
  504. "DependentParentImageFlag": bool(mpentry["Attribute"] & (1 << 31)),
  505. "DependentChildImageFlag": bool(mpentry["Attribute"] & (1 << 30)),
  506. "RepresentativeImageFlag": bool(mpentry["Attribute"] & (1 << 29)),
  507. "Reserved": (mpentry["Attribute"] & (3 << 27)) >> 27,
  508. "ImageDataFormat": (mpentry["Attribute"] & (7 << 24)) >> 24,
  509. "MPType": mpentry["Attribute"] & 0x00FFFFFF,
  510. }
  511. if mpentryattr["ImageDataFormat"] == 0:
  512. mpentryattr["ImageDataFormat"] = "JPEG"
  513. else:
  514. msg = "unsupported picture format in MPO"
  515. raise SyntaxError(msg)
  516. mptypemap = {
  517. 0x000000: "Undefined",
  518. 0x010001: "Large Thumbnail (VGA Equivalent)",
  519. 0x010002: "Large Thumbnail (Full HD Equivalent)",
  520. 0x020001: "Multi-Frame Image (Panorama)",
  521. 0x020002: "Multi-Frame Image: (Disparity)",
  522. 0x020003: "Multi-Frame Image: (Multi-Angle)",
  523. 0x030000: "Baseline MP Primary Image",
  524. }
  525. mpentryattr["MPType"] = mptypemap.get(mpentryattr["MPType"], "Unknown")
  526. mpentry["Attribute"] = mpentryattr
  527. mpentries.append(mpentry)
  528. mp[0xB002] = mpentries
  529. except KeyError as e:
  530. msg = "malformed MP Index (bad MP Entry)"
  531. raise SyntaxError(msg) from e
  532. # Next we should try and parse the individual image unique ID list;
  533. # we don't because I've never seen this actually used in a real MPO
  534. # file and so can't test it.
  535. return mp
  536. # --------------------------------------------------------------------
  537. # stuff to save JPEG files
  538. RAWMODE = {
  539. "1": "L",
  540. "L": "L",
  541. "RGB": "RGB",
  542. "RGBX": "RGB",
  543. "CMYK": "CMYK;I", # assume adobe conventions
  544. "YCbCr": "YCbCr",
  545. }
  546. # fmt: off
  547. zigzag_index = (
  548. 0, 1, 5, 6, 14, 15, 27, 28,
  549. 2, 4, 7, 13, 16, 26, 29, 42,
  550. 3, 8, 12, 17, 25, 30, 41, 43,
  551. 9, 11, 18, 24, 31, 40, 44, 53,
  552. 10, 19, 23, 32, 39, 45, 52, 54,
  553. 20, 22, 33, 38, 46, 51, 55, 60,
  554. 21, 34, 37, 47, 50, 56, 59, 61,
  555. 35, 36, 48, 49, 57, 58, 62, 63,
  556. )
  557. samplings = {
  558. (1, 1, 1, 1, 1, 1): 0,
  559. (2, 1, 1, 1, 1, 1): 1,
  560. (2, 2, 1, 1, 1, 1): 2,
  561. }
  562. # fmt: on
  563. def get_sampling(im: Image.Image) -> int:
  564. # There's no subsampling when images have only 1 layer
  565. # (grayscale images) or when they are CMYK (4 layers),
  566. # so set subsampling to the default value.
  567. #
  568. # NOTE: currently Pillow can't encode JPEG to YCCK format.
  569. # If YCCK support is added in the future, subsampling code will have
  570. # to be updated (here and in JpegEncode.c) to deal with 4 layers.
  571. if not isinstance(im, JpegImageFile) or im.layers in (1, 4):
  572. return -1
  573. sampling = im.layer[0][1:3] + im.layer[1][1:3] + im.layer[2][1:3]
  574. return samplings.get(sampling, -1)
  575. def _save(im: Image.Image, fp: IO[bytes], filename: str | bytes) -> None:
  576. if im.width == 0 or im.height == 0:
  577. msg = "cannot write empty image as JPEG"
  578. raise ValueError(msg)
  579. try:
  580. rawmode = RAWMODE[im.mode]
  581. except KeyError as e:
  582. msg = f"cannot write mode {im.mode} as JPEG"
  583. raise OSError(msg) from e
  584. info = im.encoderinfo
  585. dpi = [round(x) for x in info.get("dpi", (0, 0))]
  586. quality = info.get("quality", -1)
  587. subsampling = info.get("subsampling", -1)
  588. qtables = info.get("qtables")
  589. if quality == "keep":
  590. quality = -1
  591. subsampling = "keep"
  592. qtables = "keep"
  593. elif quality in presets:
  594. preset = presets[quality]
  595. quality = -1
  596. subsampling = preset.get("subsampling", -1)
  597. qtables = preset.get("quantization")
  598. elif not isinstance(quality, int):
  599. msg = "Invalid quality setting"
  600. raise ValueError(msg)
  601. else:
  602. if subsampling in presets:
  603. subsampling = presets[subsampling].get("subsampling", -1)
  604. if isinstance(qtables, str) and qtables in presets:
  605. qtables = presets[qtables].get("quantization")
  606. if subsampling == "4:4:4":
  607. subsampling = 0
  608. elif subsampling == "4:2:2":
  609. subsampling = 1
  610. elif subsampling == "4:2:0":
  611. subsampling = 2
  612. elif subsampling == "4:1:1":
  613. # For compatibility. Before Pillow 4.3, 4:1:1 actually meant 4:2:0.
  614. # Set 4:2:0 if someone is still using that value.
  615. subsampling = 2
  616. elif subsampling == "keep":
  617. if im.format != "JPEG":
  618. msg = "Cannot use 'keep' when original image is not a JPEG"
  619. raise ValueError(msg)
  620. subsampling = get_sampling(im)
  621. def validate_qtables(
  622. qtables: (
  623. str | tuple[list[int], ...] | list[list[int]] | dict[int, list[int]] | None
  624. ),
  625. ) -> list[list[int]] | None:
  626. if qtables is None:
  627. return qtables
  628. if isinstance(qtables, str):
  629. try:
  630. lines = [
  631. int(num)
  632. for line in qtables.splitlines()
  633. for num in line.split("#", 1)[0].split()
  634. ]
  635. except ValueError as e:
  636. msg = "Invalid quantization table"
  637. raise ValueError(msg) from e
  638. else:
  639. qtables = [lines[s : s + 64] for s in range(0, len(lines), 64)]
  640. if isinstance(qtables, (tuple, list, dict)):
  641. if isinstance(qtables, dict):
  642. qtables = [
  643. qtables[key] for key in range(len(qtables)) if key in qtables
  644. ]
  645. elif isinstance(qtables, tuple):
  646. qtables = list(qtables)
  647. if not (0 < len(qtables) < 5):
  648. msg = "None or too many quantization tables"
  649. raise ValueError(msg)
  650. for idx, table in enumerate(qtables):
  651. try:
  652. if len(table) != 64:
  653. msg = "Invalid quantization table"
  654. raise TypeError(msg)
  655. table_array = array.array("H", table)
  656. except TypeError as e:
  657. msg = "Invalid quantization table"
  658. raise ValueError(msg) from e
  659. else:
  660. qtables[idx] = list(table_array)
  661. return qtables
  662. if qtables == "keep":
  663. if im.format != "JPEG":
  664. msg = "Cannot use 'keep' when original image is not a JPEG"
  665. raise ValueError(msg)
  666. qtables = getattr(im, "quantization", None)
  667. qtables = validate_qtables(qtables)
  668. extra = info.get("extra", b"")
  669. MAX_BYTES_IN_MARKER = 65533
  670. if xmp := info.get("xmp"):
  671. overhead_len = 29 # b"http://ns.adobe.com/xap/1.0/\x00"
  672. max_data_bytes_in_marker = MAX_BYTES_IN_MARKER - overhead_len
  673. if len(xmp) > max_data_bytes_in_marker:
  674. msg = "XMP data is too long"
  675. raise ValueError(msg)
  676. size = o16(2 + overhead_len + len(xmp))
  677. extra += b"\xff\xe1" + size + b"http://ns.adobe.com/xap/1.0/\x00" + xmp
  678. if icc_profile := info.get("icc_profile"):
  679. overhead_len = 14 # b"ICC_PROFILE\0" + o8(i) + o8(len(markers))
  680. max_data_bytes_in_marker = MAX_BYTES_IN_MARKER - overhead_len
  681. markers = []
  682. while icc_profile:
  683. markers.append(icc_profile[:max_data_bytes_in_marker])
  684. icc_profile = icc_profile[max_data_bytes_in_marker:]
  685. i = 1
  686. for marker in markers:
  687. size = o16(2 + overhead_len + len(marker))
  688. extra += (
  689. b"\xff\xe2"
  690. + size
  691. + b"ICC_PROFILE\0"
  692. + o8(i)
  693. + o8(len(markers))
  694. + marker
  695. )
  696. i += 1
  697. comment = info.get("comment", im.info.get("comment"))
  698. # "progressive" is the official name, but older documentation
  699. # says "progression"
  700. # FIXME: issue a warning if the wrong form is used (post-1.1.7)
  701. progressive = info.get("progressive", False) or info.get("progression", False)
  702. optimize = info.get("optimize", False)
  703. exif = info.get("exif", b"")
  704. if isinstance(exif, Image.Exif):
  705. exif = exif.tobytes()
  706. if len(exif) > MAX_BYTES_IN_MARKER:
  707. msg = "EXIF data is too long"
  708. raise ValueError(msg)
  709. # get keyword arguments
  710. im.encoderconfig = (
  711. quality,
  712. progressive,
  713. info.get("smooth", 0),
  714. optimize,
  715. info.get("keep_rgb", False),
  716. info.get("streamtype", 0),
  717. dpi,
  718. subsampling,
  719. info.get("restart_marker_blocks", 0),
  720. info.get("restart_marker_rows", 0),
  721. qtables,
  722. comment,
  723. extra,
  724. exif,
  725. )
  726. # if we optimize, libjpeg needs a buffer big enough to hold the whole image
  727. # in a shot. Guessing on the size, at im.size bytes. (raw pixel size is
  728. # channels*size, this is a value that's been used in a django patch.
  729. # https://github.com/matthewwithanm/django-imagekit/issues/50
  730. if optimize or progressive:
  731. # CMYK can be bigger
  732. if im.mode == "CMYK":
  733. bufsize = 4 * im.size[0] * im.size[1]
  734. # keep sets quality to -1, but the actual value may be high.
  735. elif quality >= 95 or quality == -1:
  736. bufsize = 2 * im.size[0] * im.size[1]
  737. else:
  738. bufsize = im.size[0] * im.size[1]
  739. if exif:
  740. bufsize += len(exif) + 5
  741. if extra:
  742. bufsize += len(extra) + 1
  743. else:
  744. # The EXIF info needs to be written as one block, + APP1, + one spare byte.
  745. # Ensure that our buffer is big enough. Same with the icc_profile block.
  746. bufsize = max(len(exif) + 5, len(extra) + 1)
  747. ImageFile._save(
  748. im, fp, [ImageFile._Tile("jpeg", (0, 0) + im.size, 0, rawmode)], bufsize
  749. )
  750. ##
  751. # Factory for making JPEG and MPO instances
  752. def jpeg_factory(
  753. fp: IO[bytes], filename: str | bytes | None = None
  754. ) -> JpegImageFile | MpoImageFile:
  755. im = JpegImageFile(fp, filename)
  756. try:
  757. mpheader = im._getmp()
  758. if mpheader is not None and mpheader[45057] > 1:
  759. for segment, content in im.applist:
  760. if segment == "APP1" and b' hdrgm:Version="' in content:
  761. # Ultra HDR images are not yet supported
  762. return im
  763. # It's actually an MPO
  764. from .MpoImagePlugin import MpoImageFile
  765. # Don't reload everything, just convert it.
  766. im = MpoImageFile.adopt(im, mpheader)
  767. except (TypeError, IndexError):
  768. # It is really a JPEG
  769. pass
  770. except SyntaxError:
  771. warnings.warn(
  772. "Image appears to be a malformed MPO file, it will be "
  773. "interpreted as a base JPEG file"
  774. )
  775. return im
  776. # ---------------------------------------------------------------------
  777. # Registry stuff
  778. Image.register_open(JpegImageFile.format, jpeg_factory, _accept)
  779. Image.register_save(JpegImageFile.format, _save)
  780. Image.register_extensions(JpegImageFile.format, [".jfif", ".jpe", ".jpg", ".jpeg"])
  781. Image.register_mime(JpegImageFile.format, "image/jpeg")