mirror of
https://github.com/moparisthebest/SickRage
synced 2024-11-11 11:55:03 -05:00
114 lines
4.2 KiB
Python
114 lines
4.2 KiB
Python
|
"""
|
||
|
IPTC metadata parser (can be found in a JPEG picture for example)
|
||
|
|
||
|
Sources:
|
||
|
- Image-MetaData Perl module:
|
||
|
http://www.annocpan.org/~BETTELLI/Image-MetaData-JPEG-0.15/...
|
||
|
...lib/Image/MetaData/JPEG/TagLists.pod
|
||
|
- IPTC tag name and description:
|
||
|
http://peccatte.karefil.com/software/IPTCTableau.pdf
|
||
|
|
||
|
Author: Victor Stinner
|
||
|
"""
|
||
|
|
||
|
from lib.hachoir_core.field import (FieldSet, ParserError,
|
||
|
UInt8, UInt16, String, RawBytes, NullBytes)
|
||
|
from lib.hachoir_core.text_handler import textHandler, hexadecimal
|
||
|
|
||
|
def IPTC_String(parent, name, desc=None):
    """
    Create the String field holding the text content of an IPTC chunk.

    The length of the string is taken from the "size" field of parent,
    and strip=" " is forwarded to String.
    """
    # Charset may be utf-8, ISO-8859-1, or ...
    length = parent["size"].value
    return String(parent, name, length, desc, strip=" ")
|
||
|
|
||
|
# Tag tables, one per IPTC dataset number.
#
# Each table maps a tag number to a tuple:
#   (field name, description, field class or None)
# IPTC_Chunk uses the first two items as the chunk name and description, and
# calls the third one as cls(chunk, "content") to parse the content. When the
# third item is None, the content is stored as RawBytes.

# Dataset 1: no tag is described yet
dataset1 = {
}
# Dataset 2
dataset2 = {
    0: ("record_version", "Record version (2 for JPEG)", UInt16),
    5: ("obj_name", "Object name", None),
    7: ("edit_stat", "Edit status", None),
    10: ("urgency", "Urgency", UInt8),
    15: ("category[]", "Category", None),
    22: ("fixture", "Fixture identifier", IPTC_String),
    25: ("keyword[]", "Keywords", IPTC_String),
    30: ("release_date", "Release date", IPTC_String),
    35: ("release_time", "Release time", IPTC_String),
    40: ("instruction", "Special instructions", IPTC_String),
    55: ("date_created", "Date created", IPTC_String),
    60: ("time_created", "Time created (ISO 8601)", IPTC_String),
    65: ("originating_prog", "Originating program", IPTC_String),
    70: ("prog_ver", "Program version", IPTC_String),
    80: ("author", "By-line (Author)", IPTC_String),
    85: ("author_job", "By-line (Author precision)", IPTC_String),
    90: ("city", "City", IPTC_String),
    95: ("state", "Province / State", IPTC_String),
    100: ("country_code", "Country / Primary location code", IPTC_String),
    101: ("country_name", "Country / Primary location name", IPTC_String),
    103: ("trans_ref", "Original transmission reference", IPTC_String),
    105: ("headline", "Headline", IPTC_String),
    110: ("credit", "Credit", IPTC_String),
    115: ("source", "Source", IPTC_String),
    116: ("copyright", "Copyright notice", IPTC_String),
    120: ("caption", "Caption/Abstract", IPTC_String),
    122: ("writer", "Writer/editor", IPTC_String),
    231: ("history[]", "Document history (timestamp)", IPTC_String)
}
# Dataset number => tag table
datasets = {1: dataset1, 2: dataset2}
|
||
|
|
||
|
class IPTC_Size(FieldSet):
    """
    Content size of an IPTC chunk, stored as one or more 16-bit words.

    Words are read until one of them is lower than 0x8000. The value is
    built from the low 15 bits of each word, the first word read being
    the most significant one.
    """

    def __init__(self, *args, **kw):
        FieldSet.__init__(self, *args, **kw)
        total = 0
        for word in self:
            # Append the 15 payload bits of this word to the result
            total = (total << 15) + (word.value & 0x7fff)
        # The value is computed once, here, and then served as a constant
        self.createValue = lambda: total

    def createFields(self):
        more = True
        while more:
            word = UInt16(self, "value[]")
            yield word
            # Keep reading only while the word just read is 0x8000 or more
            more = (0x8000 <= word.value)
|
||
|
|
||
|
class IPTC_Chunk(FieldSet):
    """
    One IPTC chunk: signature (0x1c), dataset number, tag, content size
    and, when the size is not zero, the content itself.

    When the (dataset number, tag) pair is found in the datasets table,
    the chunk takes its name and description from the table entry, and
    the entry may also give the class used to parse the content.
    """

    def __init__(self, *args, **kw):
        FieldSet.__init__(self, *args, **kw)
        tag_table = datasets.get(self["dataset_nb"].value)
        self.dataset_info = None
        if tag_table is not None:
            info = tag_table.get(self["tag"].value)
            if info is not None:
                self.dataset_info = info
                self._name = info[0]
                self._description = info[1]
        size_field = self["size"]
        # Three one-byte header fields, the size field itself, then the
        # content (its length is given in bytes)
        header_bits = 3 * 8
        self._size = header_bits + size_field.size + size_field.value * 8

    def createFields(self):
        signature = UInt8(self, "signature", "IPTC signature (0x1c)")
        yield textHandler(signature, hexadecimal)
        if self["signature"].value != 0x1C:
            raise ParserError("Wrong IPTC signature")
        dataset_nb = UInt8(self, "dataset_nb", "Dataset number")
        yield textHandler(dataset_nb, hexadecimal)
        yield UInt8(self, "tag", "Tag")
        yield IPTC_Size(self, "size", "Content size")

        length = self["size"].value
        if length <= 0:
            # Empty chunk: there is no content field
            return
        info = self.dataset_info
        content_class = info[2] if info else None
        if content_class:
            yield content_class(self, "content")
        else:
            # Unknown tag, or no dedicated class: keep the raw bytes
            yield RawBytes(self, "content", length)
|
||
|
|
||
|
class IPTC(FieldSet):
    """
    Sequence of IPTC chunks, followed by null padding when bytes remain.

    NOTE(review): self._size and self.current_size are presumably bit
    counts (they are divided by 8 to get a number of bytes) -- confirm
    against FieldSet.
    """

    def createFields(self):
        # Use floor division (//) so that byte counts stay integers even
        # when "/" means true division (Python 3, or
        # "from __future__ import division"): NullBytes needs an integer
        # size. For Python 2 integers, // and / give the same result.

        # A chunk needs at least 5 bytes: signature, dataset number and tag
        # (one byte each) plus one 16-bit size word
        while 5 <= (self._size - self.current_size) // 8:
            yield IPTC_Chunk(self, "chunk[]")

        # Remaining bytes are too few to hold a chunk: store them as padding
        size = (self._size - self.current_size) // 8
        if 0 < size:
            yield NullBytes(self, "padding", size)
|
||
|
|