2012-12-02 12:17:39 -08:00
|
|
|
"""
|
2015-02-12 14:57:46 -08:00
|
|
|
A Python class to encapsulate CoMet data
|
2012-12-02 12:17:39 -08:00
|
|
|
"""
|
|
|
|
|
|
|
|
"""
|
2014-03-23 10:30:23 -07:00
|
|
|
Copyright 2012-2014 Anthony Beville
|
2012-12-02 12:17:39 -08:00
|
|
|
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
you may not use this file except in compliance with the License.
|
|
|
|
You may obtain a copy of the License at
|
|
|
|
|
2015-02-12 14:57:46 -08:00
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
2012-12-02 12:17:39 -08:00
|
|
|
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
See the License for the specific language governing permissions and
|
|
|
|
limitations under the License.
|
|
|
|
"""
|
|
|
|
|
|
|
|
from datetime import datetime
|
|
|
|
import zipfile
|
2015-02-12 14:57:46 -08:00
|
|
|
from pprint import pprint
|
2012-12-02 12:17:39 -08:00
|
|
|
import xml.etree.ElementTree as ET
|
2015-02-13 15:08:07 -08:00
|
|
|
|
2012-12-02 12:17:39 -08:00
|
|
|
from genericmetadata import GenericMetadata
|
|
|
|
import utils
|
|
|
|
|
2015-02-13 15:08:07 -08:00
|
|
|
|
2012-12-02 12:17:39 -08:00
|
|
|
class CoMet:
    """Convert comic metadata to and from the CoMet XML format.

    The metadata objects handled here expose plain attributes (``title``,
    ``series``, ``issue``, ``credits``, ...) as read and written by the
    methods below; new objects are created with ``GenericMetadata()``.
    """

    # Lower-case credit role names that map onto each CoMet credit element.
    # Note that 'artist' is listed for both penciller and inker, so an
    # "artist" credit is written out under both elements.
    writer_synonyms = ['writer', 'plotter', 'scripter']
    penciller_synonyms = ['artist', 'penciller', 'penciler', 'breakdowns']
    inker_synonyms = ['inker', 'artist', 'finishes']
    colorist_synonyms = ['colorist', 'colourist', 'colorer', 'colourer']
    letterer_synonyms = ['letterer']
    cover_synonyms = ['cover', 'covers', 'coverartist', 'cover artist']
    editor_synonyms = ['editor']

    def metadataFromString(self, string):
        """Parse a CoMet XML string and return the resulting metadata object.

        Raises whatever ``ET.fromstring`` raises on malformed XML, and
        ``ValueError`` when the root element is not ``<comet>``.
        """
        tree = ET.ElementTree(ET.fromstring(string))
        return self.convertXMLToMetadata(tree)

    def stringFromMetadata(self, metadata):
        """Serialize ``metadata`` to a CoMet XML string with an XML header."""
        header = '<?xml version="1.0" encoding="UTF-8"?>\n'

        # The filename argument of convertMetadataToXML is unused.
        tree = self.convertMetadataToXML(None, metadata)

        body = ET.tostring(tree.getroot())
        # On Python 3 ET.tostring returns bytes by default; decode so the
        # concatenation with the text header does not raise TypeError.
        if not isinstance(body, str):
            body = body.decode("utf-8")
        return header + body

    def indent(self, elem, level=0):
        """Add whitespace to ``elem`` and its descendants, in place.

        Used for making the XML output readable: each nesting level is
        indented by one more unit than its parent.
        """
        i = "\n" + level * " "
        if len(elem):
            if not elem.text or not elem.text.strip():
                elem.text = i + " "
            if not elem.tail or not elem.tail.strip():
                elem.tail = i
            last_child = None
            for child in elem:
                self.indent(child, level + 1)
                last_child = child
            # The last child's tail precedes the parent's closing tag, so it
            # is pulled back to the parent's own indentation level.
            if not last_child.tail or not last_child.tail.strip():
                last_child.tail = i
        else:
            if level and (not elem.tail or not elem.tail.strip()):
                elem.tail = i

    def convertMetadataToXML(self, filename, metadata):
        """Build and return an ``ElementTree`` holding ``metadata`` as CoMet.

        ``filename`` is accepted for interface compatibility but is not
        used. ``metadata`` is only read, never modified.
        """
        # shorthand for the metadata
        md = metadata

        # build a tree structure
        root = ET.Element("comet")
        root.attrib['xmlns:comet'] = "http://www.denvog.com/comet/"
        root.attrib['xmlns:xsi'] = "http://www.w3.org/2001/XMLSchema-instance"
        root.attrib[
            'xsi:schemaLocation'] = "http://www.denvog.com http://www.denvog.com/comet/comet.xsd"

        # helper func: add a child element only when a value is present
        def assign(comet_entry, md_entry):
            if md_entry is not None:
                ET.SubElement(root, comet_entry).text = u"{0}".format(md_entry)

        # title is mandatory: fall back to an empty title without touching
        # the caller's metadata object
        assign('title', md.title if md.title is not None else "")
        assign('series', md.series)
        assign('issue', md.issue)  # must be int??
        assign('volume', md.volume)
        assign('description', md.comments)
        assign('publisher', md.publisher)
        assign('pages', md.pageCount)
        assign('format', md.format)
        assign('language', md.language)
        assign('rating', md.maturityRating)
        assign('price', md.price)
        assign('isVersionOf', md.isVersionOf)
        assign('rights', md.rights)
        assign('identifier', md.identifier)
        assign('lastMark', md.lastMark)
        assign('genre', md.genre)  # TODO repeatable

        if md.characters is not None:
            for name in md.characters.split(','):
                assign('character', name.strip())

        if md.manga is not None and md.manga == "YesAndRightToLeft":
            assign('readingDirection', "rtl")

        # A date is only written when the year is known; a month on its own
        # would produce a malformed "-MM" value.
        if md.year is not None:
            date_str = str(md.year).zfill(4)
            if md.month is not None:
                date_str += "-" + str(md.month).zfill(2)
            assign('date', date_str)

        assign('coverImage', md.coverImage)

        # need to specially process the credits, since they are structured
        # differently than CIX.  Build the role lookup sets once, in the
        # order the elements are emitted for a single credit.
        role_elements = (
            ('writer', set(self.writer_synonyms)),
            ('penciller', set(self.penciller_synonyms)),
            ('inker', set(self.inker_synonyms)),
            ('colorist', set(self.colorist_synonyms)),
            ('letterer', set(self.letterer_synonyms)),
            ('coverDesigner', set(self.cover_synonyms)),
            ('editor', set(self.editor_synonyms)),
        )

        # loop thru credits, and emit an element for each role that CoMet
        # supports; a role may match more than one element
        for credit in metadata.credits:
            role = credit['role'].lower()
            for element_name, synonyms in role_elements:
                if role in synonyms:
                    ET.SubElement(root, element_name).text = u"{0}".format(
                        credit['person'])

        # self pretty-print
        self.indent(root)

        # wrap it in an ElementTree instance
        return ET.ElementTree(root)

    def convertXMLToMetadata(self, tree):
        """Translate a parsed CoMet ``ElementTree`` into a metadata object.

        Raises ``ValueError`` when the root element is not ``<comet>``.
        """
        root = tree.getroot()

        if root.tag != 'comet':
            raise ValueError(
                "Not a CoMet document: root element is <{0}>".format(root.tag))

        metadata = GenericMetadata()
        md = metadata

        # Helper function: text of the first matching child, or None
        def xlate(tag):
            node = root.find(tag)
            if node is None:
                return None
            return node.text

        md.series = xlate('series')
        md.title = xlate('title')
        md.issue = xlate('issue')
        md.volume = xlate('volume')
        md.comments = xlate('description')
        md.publisher = xlate('publisher')
        md.language = xlate('language')
        md.format = xlate('format')
        md.pageCount = xlate('pages')
        md.maturityRating = xlate('rating')
        md.price = xlate('price')
        md.isVersionOf = xlate('isVersionOf')
        md.rights = xlate('rights')
        md.identifier = xlate('identifier')
        md.lastMark = xlate('lastMark')
        md.genre = xlate('genre')  # TODO - repeatable field

        date = xlate('date')
        if date is not None:
            # str.split always yields at least one part
            parts = date.split('-')
            md.year = parts[0]
            if len(parts) > 1:
                md.month = parts[1]

        md.coverImage = xlate('coverImage')

        readingDirection = xlate('readingDirection')
        if readingDirection is not None and readingDirection == "rtl":
            md.manga = "YesAndRightToLeft"

        # loop for character tags; an empty element has text None, so guard
        # before stripping and skip blank names
        char_list = []
        for n in root:
            if n.tag == 'character':
                name = (n.text or "").strip()
                if name:
                    char_list.append(name)
        md.characters = utils.listToString(char_list)

        # Now extract the credit info
        plain_credit_tags = (
            'writer', 'penciller', 'inker', 'colorist', 'letterer', 'editor')
        for n in root:
            if n.tag in plain_credit_tags:
                credit_role = n.tag.title()
            elif n.tag == 'coverDesigner':
                credit_role = "Cover"
            else:
                continue
            person = (n.text or "").strip()
            if person:
                metadata.addCredit(person, credit_role)

        metadata.isEmpty = False

        return metadata

    # verify that the string actually contains CoMet data in XML format
    def validateString(self, string):
        """Return True when ``string`` parses as XML with a ``<comet>`` root."""
        try:
            root = ET.fromstring(string)
        except Exception:
            # Any parse failure (bad XML, wrong input type) means "not CoMet".
            return False
        return root.tag == 'comet'

    def writeToExternalFile(self, filename, metadata):
        """Write ``metadata`` as CoMet XML to ``filename``, UTF-8 encoded."""
        tree = self.convertMetadataToXML(filename, metadata)
        tree.write(filename, encoding='utf-8')

    def readFromExternalFile(self, filename):
        """Parse the CoMet XML file ``filename`` and return its metadata."""
        tree = ET.parse(filename)
        return self.convertXMLToMetadata(tree)
|