python 从Python 3中的10位DPX文件中读取元数据和图像数据

Posted

tags:

篇首语:本文由小常识网(cha138.com)小编为大家整理,主要介绍了python 从Python 3中的10位DPX文件中读取元数据和图像数据相关的知识,希望对你有一定的参考价值。

"""
dpx.py

Read Metadata and Image data from 10-bit DPX files in Python 3

Copyright (c) 2016 Jack Doerner

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
""" 

import struct
import numpy as np

# Path of the DPX file that is opened when this module is run as a script.
test_filename = "test.dpx"

# Readable labels for the header's 'orientation' code. The codes are the
# consecutive integers 0-7, so the mapping is built by enumerating the
# labels in code order.
orientations = dict(enumerate((
	"Left to Right, Top to Bottom",
	"Right to Left, Top to Bottom",
	"Left to Right, Bottom to Top",
	"Right to Left, Bottom to Top",
	"Top to Bottom, Left to Right",
	"Top to Bottom, Right to Left",
	"Bottom to Top, Left to Right",
	"Bottom to Top, Right to Left",
)))

# Readable labels for an image element's 'descriptor' code (what the
# components of each pixel represent). Codes that are absent from this table
# are reported as "unknown" by the script section of this module.
# Codes 0, 101 and 150-156 were added from the DPX (SMPTE 268M) descriptor
# table so that valid files using them are no longer labelled "unknown".
descriptors = {
	0: "User Defined",
	1: "Red",
	2: "Green",
	3: "Blue",
	4: "Alpha",
	6: "Luma (Y)",
	7: "Color Difference",
	8: "Depth (Z)",
	9: "Composite Video",
	50: "RGB",
	51: "RGBA",
	52: "ABGR",
	100: "Cb, Y, Cr, Y (4:2:2)",
	101: "Cb, Y, A, Cr, Y, A (4:2:2:4)",
	102: "Cb, Y, Cr (4:4:4)",
	103: "Cb, Y, Cr, A (4:4:4:4)",
	150: "User Defined 2-Component Element",
	151: "User Defined 3-Component Element",
	152: "User Defined 4-Component Element",
	153: "User Defined 5-Component Element",
	154: "User Defined 6-Component Element",
	155: "User Defined 7-Component Element",
	156: "User Defined 8-Component Element",
}

# Readable labels for an image element's 'packing' code. The codes are the
# consecutive integers 0-2, so the labels are enumerated in code order.
packings = dict(enumerate((
	"Packed into 32-bit words",
	"Filled to 32-bit words, Padding First",
	"Filled to 32-bit words, Padding Last",
)))

# Readable labels for an image element's 'encoding' code. The codes are the
# consecutive integers 0-1, so the labels are enumerated in code order.
encodings = dict(enumerate((
	"No encoding",
	"Run Length Encoding",
)))

# Readable labels for an image element's 'transfer_characteristic' code.
# Code 0 ("User Defined") was added from the DPX (SMPTE 268M) transfer table;
# without it such files were labelled "unknown" by the script section.
transfers = {
	0: "User Defined",
	1: "Printing Density",
	2: "Linear",
	3: "Logarithmic",
	4: "Unspecified Video",
	5: "SMPTE 274M",
	6: "ITU-R 709-4",
	7: "ITU-R 601-5 system B or G",
	8: "ITU-R 601-5 system M",
	9: "Composite Video (NTSC)",
	10: "Composite Video (PAL)",
	11: "Z (Linear Depth)",
	12: "Z (Homogenous Depth)",
}

# Readable labels for an image element's 'colorimetry' code.
# Code 0 ("User Defined") was added from the DPX (SMPTE 268M) colorimetric
# table; codes without an entry here are reported as "unknown" by the script
# section of this module.
colorimetries = {
	0: "User Defined",
	1: "Printing Density",
	4: "Unspecified Video",
	5: "SMPTE 274M",
	6: "ITU-R 709-4",
	7: "ITU-R 601-5 system B or G",
	8: "ITU-R 601-5 system M",
	9: "Composite Video (NTSC)",
	10: "Composite Video (PAL)",
}

# Header fields that readDPXMetaData reads and writeDPX writes.
propertymap = [
	# Each entry is (field name, byte offset in the file, length in bytes, type).
	# type is 'magic' (the 4-byte file signature), 'utf8' (text decoded as
	# UTF-8), or a struct format character for an integer field:
	# 'B' (1 byte), 'H' (2 bytes) or 'I' (4 bytes).

	# File information header
	('magic', 0, 4, 'magic'),
	('offset', 4, 4, 'I'),  # where the image data starts (used by the image reader/writer)
	('dpx_version', 8, 8, 'utf8'),
	('file_size', 16, 4, 'I'),
	('ditto', 20, 4, 'I'),
	('filename', 36, 100, 'utf8'),
	('timestamp', 136, 24, 'utf8'),
	('creator', 160, 100, 'utf8'),
	('project_name', 260, 200, 'utf8'),
	('copyright', 460, 200, 'utf8'),
	('encryption_key', 660, 4, 'I'),

	# Image information header
	('orientation', 768, 2, 'H'),
	('image_element_count', 770, 2, 'H'),
	('width', 772, 4, 'I'),
	('height', 776, 4, 'I'),

	# Image element 1
	('data_sign', 780, 4, 'I'),
	('descriptor', 800, 1, 'B'),
	('transfer_characteristic', 801, 1, 'B'),
	('colorimetry', 802, 1, 'B'),
	('depth', 803, 1, 'B'),
	('packing', 804, 2, 'H'),
	('encoding', 806, 2, 'H'),
	('line_padding', 812, 4, 'I'),
	('image_padding', 816, 4, 'I'),
	('image_element_description', 820, 32, 'utf8'),

	# Image source information header
	('input_device_name', 1556, 32, 'utf8'),
	('input_device_sn', 1588, 32, 'utf8')
]

def readDPXMetaData(f):
	"""Read the header fields listed in ``propertymap`` from a DPX file.

	Args:
		f: Seekable binary file object. It is repositioned for every field,
			so its position on entry does not matter.

	Returns:
		A dict mapping each ``propertymap`` field name to its value, plus an
		'endianness' entry ('be' or 'le') derived from the magic number.
		Text fields are cut at the first NUL byte, so the NUL padding of the
		fixed-width header fields is not part of the returned strings.
		Returns None when the file does not start with the magic number
		"SDPX" or "XPDS", or ends before one of the listed fields.
	"""
	f.seek(0)
	magic = f.read(4)
	# Compare the raw bytes: decoding them first would raise
	# UnicodeDecodeError on arbitrary non-DPX binary data instead of
	# rejecting the file.
	if magic == b"SDPX":
		byte_order, endianness = ">", "be"
	elif magic == b"XPDS":
		byte_order, endianness = "<", "le"
	else:
		return None

	meta = {}

	for name, offset, length, kind in propertymap:
		f.seek(offset)
		data = f.read(length)
		if len(data) != length:
			# Truncated header: treat the file as invalid rather than letting
			# struct.unpack fail or returning a partial text field.
			return None
		if kind == 'magic':
			meta[name] = data.decode('ascii')
			meta['endianness'] = endianness
		elif kind == 'utf8':
			# errors='replace' keeps unused or non-UTF-8 filler bytes from
			# aborting the whole read.
			text = data.decode('UTF-8', errors='replace')
			meta[name] = text.split('\x00', 1)[0]
		elif kind in ('B', 'H', 'I'):
			meta[name] = struct.unpack(byte_order + kind, data)[0]

	return meta

def readDPXImageData(f, meta):
	"""Decode the image of a 10-bit RGB DPX file into a float array.

	Only one layout is supported: bit depth 10, descriptor 50 (RGB),
	packing 1 and encoding 0. Each pixel is one 32-bit word holding the red,
	green and blue codes in bits 31-22, 21-12 and 11-2. The 'line_padding'
	header value is not taken into account.

	Args:
		f: Seekable binary file object (a real file or an in-memory buffer).
		meta: Header dict providing 'depth', 'packing', 'encoding',
			'descriptor', 'width', 'height', 'offset' and 'endianness'
			('be' or 'le').

	Returns:
		A (height, width, 3) float array with every channel scaled to
		[0, 1], or None when the file layout is not the supported one.

	Raises:
		ValueError: If the file ends before width * height pixels were read.
	"""
	if meta['depth'] != 10 or meta['packing'] != 1 or meta['encoding'] != 0 or meta['descriptor'] != 50:
		return None

	width = meta['width']
	height = meta['height']

	# An explicit byte order in the dtype decodes correctly on any host; an
	# unconditional byteswap() is only right on little-endian machines.
	word_dtype = np.dtype('>u4' if meta['endianness'] == 'be' else '<u4')
	byte_count = width * height * word_dtype.itemsize

	f.seek(meta['offset'])
	data = f.read(byte_count)
	if len(data) != byte_count:
		raise ValueError(
			"DPX image data is truncated: expected %d bytes, got %d"
			% (byte_count, len(data))
		)
	words = np.frombuffer(data, dtype=word_dtype).reshape((height, width))

	image = np.empty((height, width, 3), dtype=float)
	for channel, shift in enumerate((22, 12, 2)):
		image[:, :, channel] = ((words >> shift) & 0x000003FF) / 0x000003FF

	return image

def writeDPX(f, image, meta):
	"""Write header fields and 10-bit RGB image data to a DPX file.

	Only the ``propertymap`` fields that are present in ``meta`` are written;
	every other header byte is left as it is in ``f``. Pixels are stored one
	per 32-bit word with the red, green and blue codes in bits 31-22, 21-12
	and 11-2.

	Args:
		f: Seekable binary file object opened for writing.
		image: Array-like of shape (height, width, >=3) with channel values
			in [0, 1]; channels 0, 1 and 2 are written as R, G and B.
		meta: Header dict. 'endianness' ('be' or 'le') selects the byte
			order and the magic number; 'offset' is where the image data is
			written.

	Raises:
		struct.error: If an integer field value does not fit its field.
	"""
	big_endian = meta['endianness'] == 'be'
	byte_order = ">" if big_endian else "<"

	for name, offset, length, kind in propertymap:
		if name not in meta:
			continue
		if kind == 'magic':
			data = b'SDPX' if big_endian else b'XPDS'
		elif kind == 'utf8':
			# Header text fields are fixed width: cut over-long values so
			# they cannot overwrite the following fields, and pad short ones
			# with NUL bytes so stale bytes in the file are overwritten.
			data = meta[name].encode(encoding='UTF-8')[:length].ljust(length, b'\x00')
		else:
			data = struct.pack(byte_order + kind, meta[name])
		f.seek(offset)
		f.write(data)

	# Quantise to 10-bit codes. Rounding (instead of truncating) maps a value
	# to its nearest code, and clipping keeps values outside [0, 1] from
	# wrapping around when only the low 10 bits are kept.
	codes = np.rint(np.clip(np.asarray(image)[:, :, :3], 0.0, 1.0) * 0x000003FF).astype(np.uint32)
	words = (codes[:, :, 0] << 22) | (codes[:, :, 1] << 12) | (codes[:, :, 2] << 2)

	# Convert to the requested byte order explicitly so the output does not
	# depend on the byte order of the machine running this code.
	raw = words.astype('>u4' if big_endian else '<u4')

	f.seek(meta['offset'])
	f.write(raw.tobytes())

if __name__ == "__main__":
	# Demo: print the header of test_filename and, when the image layout is
	# supported by readDPXImageData, display the image with matplotlib.
	with open(test_filename, "rb") as f:
		meta = readDPXMetaData(f)
		if meta is None:
			print("Invalid File")
		else:
			print("\nFILE INFORMATION HEADER")

			# readDPXMetaData stores 'be' / 'le' here, not the struct prefixes
			# '>' / '<', so the comparison must be against 'be'.
			print("Endianness:","Big Endian" if meta['endianness'] == "be" else "Little Endian")
			print("Image Offset (Bytes):",meta['offset'])
			print("DPX Version:",meta['dpx_version'])
			print("File Size (Bytes):",meta['file_size'])
			print("Ditto Flag:","New Frame" if meta['ditto'] else "Same as Previous Frame")
			print("Image Filename:",meta['filename'])
			print("Creation Timestamp:",meta['timestamp'])
			print("Creator:",meta['creator'])
			print("Project Name:",meta['project_name'])
			print("Copyright:",meta['copyright'])
			# The key is an int; format it as hex directly (hexlify() only
			# accepts bytes-like objects and raised TypeError here).
			print("Encryption Key:","Unencrypted" if meta['encryption_key'] == 0xFFFFFFFF else "0x%08X" % meta['encryption_key'])


			print("\nIMAGE INFORMATION HEADER")
			print("Orientation:", orientations.get(meta['orientation'], "unknown"))
			print("Image Element Count:", meta['image_element_count'])
			print("Width:", meta['width'])
			print("Height:", meta['height'])

			print("\nIMAGE ELEMENT 1")
			print("Data Sign:", "signed" if meta['data_sign'] == 1 else "unsigned")
			print("Descriptor:", descriptors.get(meta['descriptor'], "unknown"))
			print("Transfer:",transfers.get(meta['transfer_characteristic'], "unknown"))
			print("Colorimetry:",colorimetries.get(meta['colorimetry'], "unknown"))
			print("Bit Depth:",meta['depth'])
			print("Packing:",packings.get(meta['packing'], "unknown"))
			print("Encoding:",encodings.get(meta['encoding'], "unknown"))
			print("End of Line Padding:",meta['line_padding'])
			print("End of Image Padding:",meta['image_padding'])
			print("Image Element Description:",meta['image_element_description'])

			print("\nIMAGE SOURCE INFORMATION HEADER")
			print("Input Device Name:",meta['input_device_name'])
			print("Input Device Serial Number:",meta['input_device_sn'])

			print("\n")

			image = readDPXImageData(f, meta)

			if image is None:
				print("DPX Type not Implemented")
			else:
				# Imported here so matplotlib is only needed when an image is
				# actually displayed.
				from matplotlib import pyplot as plt
				plt.imshow(image, interpolation='nearest')
				plt.show()

以上是关于python 从Python 3中的10位DPX文件中读取元数据和图像数据的主要内容,如果未能解决你的问题,请参考以下文章

Python:读取 12 位二进制文件

如何从日期对象python获取以毫秒(秒后3位小数)为单位的时间值?

如何从python中的整数列中获取前4位数字

如何强制 Python 进入 64 位模式

Python 将一个值转换为 16 位 2 的补码

如何从python中的文本文档中删除所有标点符号和其他符号?