Pillow/src/PIL/PpmImagePlugin.py

349 lines
12 KiB
Python
Raw Normal View History

2010-07-31 06:52:47 +04:00
#
# The Python Imaging Library.
# $Id$
#
# PPM support for PIL
#
# History:
# 96-03-24 fl Created
# 98-03-06 fl Write RGBA images (as RGB, that is)
#
# Copyright (c) Secret Labs AB 1997-98.
# Copyright (c) Fredrik Lundh 1996.
#
# See the README file for information on usage and redistribution.
#
from . import Image, ImageFile
2022-03-09 14:29:45 +03:00
from ._binary import i16be as i16
from ._binary import o8
from ._binary import o32le as o32
2010-07-31 06:52:47 +04:00
#
# --------------------------------------------------------------------
# Bytes treated as whitespace in a header: space, TAB, LF, VT, FF and CR.
b_whitespace = b" \t\n\v\f\r"

# Maps a file's magic number to the image mode used for it.
MODES = {
    # standard Netpbm magic numbers
    b"P1": "1",
    b"P2": "L",
    b"P3": "RGB",
    b"P4": "1",
    b"P5": "L",
    b"P6": "RGB",
    # extensions
    b"P0CMYK": "CMYK",
    # PIL extensions (for test purposes only)
    b"PyP": "P",
    b"PyRGBA": "RGBA",
    b"PyCMYK": "CMYK",
}
2014-08-26 17:47:10 +04:00
2010-07-31 06:52:47 +04:00
def _accept(prefix):
    """
    Report whether ``prefix`` looks like the start of a file this plugin handles.

    :param prefix: The first bytes of the file.
    :returns: ``True`` if ``prefix`` starts with ``P`` followed by one of
        ``0123456y``, ``False`` otherwise.
    """
    # A prefix shorter than two bytes cannot hold a magic number.  Checking the
    # length first also keeps prefix[1] from raising IndexError on a file that
    # consists of a single "P".
    return len(prefix) >= 2 and prefix[0:1] == b"P" and prefix[1] in b"0123456y"
2010-07-31 06:52:47 +04:00
2014-08-26 17:47:10 +04:00
2010-07-31 06:52:47 +04:00
##
# Image plugin for PBM, PGM, and PPM images.
2019-03-21 16:28:20 +03:00
2010-07-31 06:52:47 +04:00
class PpmImageFile(ImageFile.ImageFile):
    """
    Image file handler for PBM, PGM and PPM images, plus the extension magic
    numbers listed in ``MODES``.
    """

    format = "PPM"
    format_description = "Pbmplus image"

    def _read_magic(self):
        """
        Read the magic number from the current position of ``self.fp``.

        Bytes are consumed one at a time until a whitespace byte or end of file
        is met, or until six bytes (the longest known magic number) have been
        collected.  The terminating whitespace byte is consumed as well.

        :returns: The magic number as ``bytes`` (possibly empty).
        """
        magic = b""
        while len(magic) < 6:
            char = self.fp.read(1)
            if not char or char in b_whitespace:
                break
            magic += char
        return magic

    def _read_token(self):
        """
        Read the next whitespace-delimited header token from ``self.fp``.

        Leading whitespace is skipped.  A ``#`` starts a comment that is
        discarded up to and including the next CR or LF (or up to end of file).

        :returns: The token as ``bytes``.
        :raises ValueError: If end of file is reached before any token byte is
            read, or if the token is longer than 10 bytes.
        """
        token = b""
        # Reading stops one byte past the limit so an oversized token is detectable.
        while len(token) <= 10:
            char = self.fp.read(1)
            if not char:
                break
            if char == b"#":
                # An empty read is "in" any bytes object, so EOF ends this loop too.
                while self.fp.read(1) not in b"\r\n":
                    pass
                continue
            if char in b_whitespace:
                if token:
                    # whitespace after token data terminates the token
                    break
                # whitespace before the token is skipped
                continue
            token += char

        if not token:
            # Token was not even 1 byte
            raise ValueError("Reached EOF while reading header")
        if len(token) > 10:
            raise ValueError(f"Token too long in file header: {token.decode()}")
        return token

    def _open(self):
        """
        Parse the header and set the mode, size and tile descriptor.

        :raises SyntaxError: If the magic number is not a key of ``MODES``.
        :raises ValueError: If a header token is malformed, or if maxval is
            not in the range 1..65535.
        """
        magic_number = self._read_magic()
        try:
            mode = MODES[magic_number]
        except KeyError:
            raise SyntaxError("not a PPM file")

        # Only the six standard magic numbers get a more specific MIME type.
        mimetypes = {
            b"P1": "image/x-portable-bitmap",
            b"P4": "image/x-portable-bitmap",
            b"P2": "image/x-portable-graymap",
            b"P5": "image/x-portable-graymap",
            b"P3": "image/x-portable-pixmap",
            b"P6": "image/x-portable-pixmap",
        }
        if magic_number in mimetypes:
            self.custom_mimetype = mimetypes[magic_number]

        xsize = int(self._read_token())
        ysize = int(self._read_token())

        maxval = None
        decoder_name = "raw"
        if mode == "1":
            # Bitmaps have no maxval token in the header.
            self.mode = "1"
            rawmode = "1;I"
        else:
            self.mode = rawmode = mode
            maxval = int(self._read_token())
            if not 0 < maxval < 65536:
                raise ValueError(
                    "maxval must be greater than 0 and less than 65536"
                )
            if mode == "L" and maxval > 255:
                # More than eight bits per sample: use mode "I" instead.
                self.mode = "I"

            # If maxval matches a bit depth, use the raw decoder directly
            if mode == "L" and maxval == 65535:
                rawmode = "I;16B"
            elif maxval != 255:
                decoder_name = "ppm"

        # The plain (ASCII) variants always use the plain decoder.
        if magic_number in (b"P1", b"P2", b"P3"):
            decoder_name = "ppm_plain"

        if decoder_name == "raw":
            args = (rawmode, 0, 1)
        else:
            args = (rawmode, maxval)
        self._size = xsize, ysize
        self.tile = [(decoder_name, (0, 0, xsize, ysize), self.fp.tell(), args)]
2010-07-31 06:52:47 +04:00
2014-08-26 17:47:10 +04:00
2010-07-31 06:52:47 +04:00
#
# --------------------------------------------------------------------
2019-03-21 16:28:20 +03:00
2021-01-16 22:52:40 +03:00
class PpmPlainDecoder(ImageFile.PyDecoder):
    """
    Decoder for the plain (ASCII) rasters used by the P1, P2 and P3 formats.

    The raster is pulled from ``self.fd`` in blocks of ``ImageFile.SAFEBLOCK``
    bytes.  ``#`` comments are removed and the remaining decimal tokens are
    converted to samples.  For modes other than "1", samples are scaled from
    ``0..maxval`` to the full range of the output mode (255, or 65535 for mode
    "I"), matching what ``PpmDecoder`` does for binary rasters.
    """

    _pulls_fd = True

    def _read_block(self):
        """Read the next block of raster data; empty at end of file."""
        return self.fd.read(ImageFile.SAFEBLOCK)

    def _find_comment_end(self, block, start=0):
        """
        Find where a comment ends.

        :returns: The index of the first CR or LF in ``block`` at or after
            ``start``, or -1 if ``block`` contains neither.
        """
        line_feed = block.find(b"\n", start)
        carriage_return = block.find(b"\r", start)
        # Compare against -1 explicitly: index 0 is a valid position, so a test
        # based on the sign of a product would mishandle a line ending there.
        if line_feed == -1:
            return carriage_return
        if carriage_return == -1:
            return line_feed
        return min(line_feed, carriage_return)

    def _finish_comment(self, block):
        """
        Drop the tail of a comment that started in an earlier block.

        Further blocks are read for as long as the comment has not ended.

        :returns: The data following the comment's line ending; empty if end
            of file was reached first.
        """
        while block:
            comment_end = self._find_comment_end(block)
            if comment_end != -1:
                # comment ends in this block: delete its tail
                return block[comment_end + 1 :]
            # comment spans the whole block
            block = self._read_block()
        return block

    def _ignore_comments(self, block):
        """
        Delete comments from ``block``.

        :returns: A tuple ``(block, comment_spans)``; ``comment_spans`` is
            ``True`` if the last comment does not end in this block.
        """
        comment_spans = False
        while True:
            comment_start = block.find(b"#")  # look for next comment
            if comment_start == -1:  # no comment found
                break
            comment_end = self._find_comment_end(block, comment_start)
            if comment_end != -1:  # comment ends in this block
                # delete the comment together with its line ending
                block = block[:comment_start] + block[comment_end + 1 :]
            else:  # last comment continues to next block(s)
                block = block[:comment_start]
                comment_spans = True
                break
        return block, comment_spans

    def _decode_bitonal(self):
        """
        Decode a plain PBM raster.

        This is a separate method because in the plain PBM format all data
        tokens are exactly one byte, so the inter-token whitespace is optional.

        :returns: One byte per pixel: 0xFF for token ``0``, 0x00 for ``1``.
        :raises ValueError: If a token other than ``0`` or ``1`` is found.
        """
        data = bytearray()
        total_bytes = self.state.xsize * self.state.ysize

        comment_spans = False
        while len(data) != total_bytes:
            block = self._read_block()  # read next block
            if not block:
                # eof
                break

            if comment_spans:
                block = self._finish_comment(block)
            block, comment_spans = self._ignore_comments(block)

            tokens = b"".join(block.split())
            # Whatever is left after deleting the valid digits is invalid.
            invalid = tokens.translate(None, b"01")
            if invalid:
                raise ValueError(f"Invalid token for this mode: {invalid[:1]}")
            data = (data + tokens)[:total_bytes]
        invert = bytes.maketrans(b"01", b"\xFF\x00")
        return data.translate(invert)

    def _decode_blocks(self, maxval):
        """
        Decode a plain PGM or PPM raster.

        :param maxval: The maximum sample value declared in the header.
        :returns: The samples scaled to the output range, one byte each, or
            four little-endian bytes each for mode "I".  Shorter than the
            image if the file ends early.
        :raises ValueError: If a token is longer than 10 bytes, is not a
            decimal integer, is negative, or exceeds ``maxval``.
        """
        data = bytearray()
        max_len = 10
        is_int = self.mode == "I"
        out_byte_count = 4 if is_int else 1
        out_max = 65535 if is_int else 255
        bands = Image.getmodebands(self.mode)
        total_bytes = self.state.xsize * self.state.ysize * bands * out_byte_count

        comment_spans = False
        half_token = b""  # start of a token cut off by the end of a block
        while len(data) != total_bytes:
            block = self._read_block()  # read next block
            eof = not block
            if eof:
                if not half_token:
                    break
                # otherwise fall through to flush half_token as the last token
            else:
                if comment_spans:
                    block = self._finish_comment(block)
                block, comment_spans = self._ignore_comments(block)

            if half_token:
                block = half_token + block  # stitch half_token to new block
                # Clear it, so it is neither stitched onto later blocks nor
                # flushed more than once at end of file.
                half_token = b""

            tokens = block.split()

            if not eof and block and not block[-1:].isspace():
                # block might split token: save the tail for later
                half_token = tokens.pop()
                if len(half_token) > max_len:  # prevent buildup of half_token
                    raise ValueError(
                        f"Token too long found in data: {half_token[:max_len + 1]}"
                    )

            for token in tokens:
                if len(token) > max_len:
                    raise ValueError(
                        f"Token too long found in data: {token[:max_len + 1]}"
                    )
                value = int(token)
                if value < 0:
                    raise ValueError(f"Channel value is negative: {value}")
                if value > maxval:
                    raise ValueError(f"Channel value too large for this mode: {value}")
                value = round(value / maxval * out_max)
                data += o32(value) if is_int else o8(value)
                if len(data) == total_bytes:  # finished!
                    break
        return data

    def decode(self, buffer):
        """
        Decode the whole raster from ``self.fd`` into the image.

        :param buffer: Unused; the data is pulled from ``self.fd``.
        :returns: ``(-1, 0)``.
        """
        if self.mode == "1":
            data = self._decode_bitonal()
            rawmode = "1;8"
        else:
            # The decoded samples are always in the layout below, so the
            # rawmode passed in the tile arguments is not used; only maxval is.
            maxval = self.args[-1]
            data = self._decode_blocks(maxval)
            rawmode = "I;32" if self.mode == "I" else self.mode
        self.set_as_raw(bytes(data), rawmode)
        return -1, 0
2022-03-09 14:29:45 +03:00
class PpmDecoder(ImageFile.PyDecoder):
    """
    Decoder for binary rasters whose maxval is not handled by the raw decoder.

    Samples are read from ``self.fd`` and scaled from ``0..maxval`` to the
    full range of the output mode.
    """

    _pulls_fd = True

    def decode(self, buffer):
        """
        Decode the whole raster from ``self.fd`` into the image.

        :param buffer: Unused; the data is pulled from ``self.fd``.
        :returns: ``(-1, 0)``.
        """
        is_int = self.mode == "I"
        maxval = min(self.args[-1], 65535)
        # Samples are stored in one byte up to maxval 255, else two (big endian).
        sample_size = 1 if maxval < 256 else 2
        out_max = 65535 if is_int else 255
        bands = Image.getmodebands(self.mode)
        pixel_size = sample_size * bands
        out_sample_size = 4 if is_int else 1
        expected = self.state.xsize * self.state.ysize * bands * out_sample_size

        data = bytearray()
        while len(data) < expected:
            pixel = self.fd.read(pixel_size)
            if len(pixel) < pixel_size:
                # eof
                break
            for band in range(bands):
                if sample_size == 1:
                    sample = pixel[band]
                else:
                    sample = i16(pixel, band * sample_size)
                scaled = min(out_max, round(sample / maxval * out_max))
                data += o32(scaled) if is_int else o8(scaled)

        rawmode = "I;32" if is_int else self.mode
        self.set_as_raw(bytes(data), (rawmode, 0, 1))
        return -1, 0
2010-07-31 06:52:47 +04:00
2014-08-26 17:47:10 +04:00
2021-01-16 22:52:40 +03:00
#
# --------------------------------------------------------------------
2010-07-31 06:52:47 +04:00
def _save(im, fp, filename):
    """
    Write ``im`` to ``fp`` as a binary PBM, PGM or PPM file.

    :param im: The image to write.  Modes "1", "L", "I", "RGB" and "RGBA" are
        accepted; "RGBA" is written with the "RGB" rawmode.
    :param fp: The binary file object to write to.
    :param filename: Unused.
    :raises OSError: If the image mode is not one of the accepted modes.
    """
    # mode -> (rawmode, magic number, maxval line or None when there is none)
    layouts = {
        "1": ("1;I", b"P4", None),
        "L": ("L", b"P5", b"255\n"),
        "I": ("I;16B", b"P5", b"65535\n"),
        "RGB": ("RGB", b"P6", b"255\n"),
        "RGBA": ("RGB", b"P6", b"255\n"),
    }
    layout = layouts.get(im.mode)
    if layout is None:
        raise OSError(f"cannot write mode {im.mode} as PPM")
    rawmode, head, maxval_line = layout

    fp.write(head + b"\n%d %d\n" % im.size)
    if maxval_line is not None:
        fp.write(maxval_line)
    ImageFile._save(im, fp, [("raw", (0, 0) + im.size, 0, (rawmode, 0, 1))])

    # ALTERNATIVE: save via builtin debug function
    # im._dump(filename)
2019-03-21 16:28:20 +03:00
2010-07-31 06:52:47 +04:00
#
# --------------------------------------------------------------------
2021-03-21 06:33:05 +03:00
# Decoders, looked up by name from the tile descriptor built in PpmImageFile._open
Image.register_decoder("ppm", PpmDecoder)
Image.register_decoder("ppm_plain", PpmPlainDecoder)

# Open and save handlers
Image.register_open(PpmImageFile.format, PpmImageFile, _accept)
Image.register_save(PpmImageFile.format, _save)

# File extensions and MIME type associated with the format
Image.register_extensions(PpmImageFile.format, [".pbm", ".pgm", ".ppm", ".pnm"])
Image.register_mime(PpmImageFile.format, "image/x-portable-anymap")