2015-02-16 04:27:21 -08:00
|
|
|
# coding=utf-8
|
2015-02-21 18:30:32 -08:00
|
|
|
"""Some generic utilities"""
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
# Copyright 2012-2014 Anthony Beville
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2020-07-06 16:11:15 -07:00
|
|
|
import codecs
|
|
|
|
import locale
|
2015-02-16 04:27:21 -08:00
|
|
|
import os
|
|
|
|
import platform
|
2020-07-06 16:11:15 -07:00
|
|
|
import re
|
|
|
|
import sys
|
2015-02-16 04:27:21 -08:00
|
|
|
|
|
|
|
|
|
|
|
class UtilsVars:
|
2015-02-21 18:30:32 -08:00
|
|
|
already_fixed_encoding = False
|
|
|
|
|
2015-02-16 04:27:21 -08:00
|
|
|
|
|
|
|
def get_actual_preferred_encoding():
|
2015-02-21 18:30:32 -08:00
|
|
|
preferred_encoding = locale.getpreferredencoding()
|
|
|
|
if platform.system() == "Darwin":
|
|
|
|
preferred_encoding = "utf-8"
|
|
|
|
return preferred_encoding
|
|
|
|
|
|
|
|
|
|
|
|
def fix_output_encoding():
|
|
|
|
if not UtilsVars.already_fixed_encoding:
|
|
|
|
# this reads the environment and inits the right locale
|
|
|
|
locale.setlocale(locale.LC_ALL, "")
|
|
|
|
|
|
|
|
# try to make stdout/stderr encodings happy for unicode printing
|
|
|
|
preferred_encoding = get_actual_preferred_encoding()
|
|
|
|
sys.stdout = codecs.getwriter(preferred_encoding)(sys.stdout)
|
|
|
|
sys.stderr = codecs.getwriter(preferred_encoding)(sys.stderr)
|
|
|
|
UtilsVars.already_fixed_encoding = True
|
|
|
|
|
|
|
|
|
|
|
|
def get_recursive_filelist(pathlist):
|
|
|
|
"""Get a recursive list of of all files under all path items in the list"""
|
|
|
|
|
|
|
|
filename_encoding = sys.getfilesystemencoding()
|
|
|
|
filelist = []
|
|
|
|
for p in pathlist:
|
|
|
|
# if path is a folder, walk it recursively, and all files underneath
|
|
|
|
if isinstance(p, str):
|
|
|
|
# make sure string is unicode
|
2020-07-06 16:11:15 -07:00
|
|
|
# p = p.decode(filename_encoding) # , 'replace')
|
2018-09-19 13:05:39 -07:00
|
|
|
pass
|
|
|
|
elif not isinstance(p, str):
|
2015-02-21 18:30:32 -08:00
|
|
|
# it's probably a QString
|
2018-09-19 13:05:39 -07:00
|
|
|
p = str(p)
|
2015-02-21 18:30:32 -08:00
|
|
|
|
|
|
|
if os.path.isdir(p):
|
|
|
|
for root, dirs, files in os.walk(p):
|
|
|
|
for f in files:
|
|
|
|
if isinstance(f, str):
|
|
|
|
# make sure string is unicode
|
2020-07-06 16:11:15 -07:00
|
|
|
# f = f.decode(filename_encoding, 'replace')
|
2018-09-19 13:05:39 -07:00
|
|
|
pass
|
|
|
|
elif not isinstance(f, str):
|
2015-02-21 18:30:32 -08:00
|
|
|
# it's probably a QString
|
2018-09-19 13:05:39 -07:00
|
|
|
f = str(f)
|
2015-02-21 18:30:32 -08:00
|
|
|
filelist.append(os.path.join(root, f))
|
|
|
|
else:
|
|
|
|
filelist.append(p)
|
|
|
|
|
|
|
|
return filelist
|
|
|
|
|
|
|
|
|
|
|
|
def listToString(l):
|
|
|
|
string = ""
|
|
|
|
if l is not None:
|
|
|
|
for item in l:
|
|
|
|
if len(string) > 0:
|
|
|
|
string += ", "
|
|
|
|
string += item
|
|
|
|
return string
|
|
|
|
|
|
|
|
|
|
|
|
def addtopath(dirname):
|
|
|
|
if dirname is not None and dirname != "":
|
|
|
|
|
|
|
|
# verify that path doesn't already contain the given dirname
|
|
|
|
tmpdirname = re.escape(dirname)
|
2020-07-06 16:11:15 -07:00
|
|
|
pattern = r"{sep}{dir}$|^{dir}{sep}|{sep}{dir}{sep}|^{dir}$".format(dir=tmpdirname, sep=os.pathsep)
|
2015-02-21 18:30:32 -08:00
|
|
|
|
2020-07-06 16:11:15 -07:00
|
|
|
match = re.search(pattern, os.environ["PATH"])
|
2015-02-21 18:30:32 -08:00
|
|
|
if not match:
|
2020-07-06 16:11:15 -07:00
|
|
|
os.environ["PATH"] = dirname + os.pathsep + os.environ["PATH"]
|
2015-02-16 04:27:21 -08:00
|
|
|
|
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
def which(program):
|
|
|
|
"""Returns path of the executable, if it exists"""
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
def is_exe(fpath):
|
|
|
|
return os.path.isfile(fpath) and os.access(fpath, os.X_OK)
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
fpath, fname = os.path.split(program)
|
|
|
|
if fpath:
|
|
|
|
if is_exe(program):
|
|
|
|
return program
|
|
|
|
else:
|
|
|
|
for path in os.environ["PATH"].split(os.pathsep):
|
|
|
|
exe_file = os.path.join(path, program)
|
|
|
|
if is_exe(exe_file):
|
|
|
|
return exe_file
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
return None
|
2015-02-16 04:27:21 -08:00
|
|
|
|
|
|
|
|
2019-09-05 14:40:14 -07:00
|
|
|
def xlate(data, isInt=False):
|
|
|
|
class Default(dict):
|
|
|
|
def __missing__(self, key):
|
|
|
|
return None
|
2020-07-06 16:11:15 -07:00
|
|
|
|
2019-09-05 14:40:14 -07:00
|
|
|
if data is None or data == "":
|
|
|
|
return None
|
|
|
|
if isInt:
|
2020-07-06 16:11:15 -07:00
|
|
|
i = str(data).translate(Default(zip((ord(c) for c in "1234567890"), "1234567890")))
|
2019-09-05 14:40:14 -07:00
|
|
|
if i == "0":
|
|
|
|
return "0"
|
|
|
|
if i is "":
|
|
|
|
return None
|
|
|
|
return int(i)
|
|
|
|
else:
|
|
|
|
return str(data)
|
|
|
|
|
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
def removearticles(text):
|
|
|
|
text = text.lower()
|
2020-07-06 16:11:15 -07:00
|
|
|
articles = ["and", "a", "&", "issue", "the"]
|
|
|
|
newText = ""
|
|
|
|
for word in text.split(" "):
|
2015-02-21 18:30:32 -08:00
|
|
|
if word not in articles:
|
2020-07-06 16:11:15 -07:00
|
|
|
newText += word + " "
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
newText = newText[:-1]
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
return newText
|
2015-02-16 04:27:21 -08:00
|
|
|
|
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
def unique_file(file_name):
|
|
|
|
counter = 1
|
|
|
|
# returns ('/path/file', '.ext')
|
|
|
|
file_name_parts = os.path.splitext(file_name)
|
|
|
|
while True:
|
|
|
|
if not os.path.lexists(file_name):
|
|
|
|
return file_name
|
2020-07-06 16:11:15 -07:00
|
|
|
file_name = file_name_parts[0] + " (" + str(counter) + ")" + file_name_parts[1]
|
2015-02-21 18:30:32 -08:00
|
|
|
counter += 1
|
2015-02-16 04:27:21 -08:00
|
|
|
|
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
# -o- coding: utf-8 -o-
|
|
|
|
# ISO639 python dict
|
|
|
|
# official list in http://www.loc.gov/standards/iso639-2/php/code_list.php
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
lang_dict = {
|
2020-07-06 16:11:15 -07:00
|
|
|
"ab": "Abkhaz",
|
|
|
|
"aa": "Afar",
|
|
|
|
"af": "Afrikaans",
|
|
|
|
"ak": "Akan",
|
|
|
|
"sq": "Albanian",
|
|
|
|
"am": "Amharic",
|
|
|
|
"ar": "Arabic",
|
|
|
|
"an": "Aragonese",
|
|
|
|
"hy": "Armenian",
|
|
|
|
"as": "Assamese",
|
|
|
|
"av": "Avaric",
|
|
|
|
"ae": "Avestan",
|
|
|
|
"ay": "Aymara",
|
|
|
|
"az": "Azerbaijani",
|
|
|
|
"bm": "Bambara",
|
|
|
|
"ba": "Bashkir",
|
|
|
|
"eu": "Basque",
|
|
|
|
"be": "Belarusian",
|
|
|
|
"bn": "Bengali",
|
|
|
|
"bh": "Bihari",
|
|
|
|
"bi": "Bislama",
|
|
|
|
"bs": "Bosnian",
|
|
|
|
"br": "Breton",
|
|
|
|
"bg": "Bulgarian",
|
|
|
|
"my": "Burmese",
|
|
|
|
"ca": "Catalan; Valencian",
|
|
|
|
"ch": "Chamorro",
|
|
|
|
"ce": "Chechen",
|
|
|
|
"ny": "Chichewa; Chewa; Nyanja",
|
|
|
|
"zh": "Chinese",
|
|
|
|
"cv": "Chuvash",
|
|
|
|
"kw": "Cornish",
|
|
|
|
"co": "Corsican",
|
|
|
|
"cr": "Cree",
|
|
|
|
"hr": "Croatian",
|
|
|
|
"cs": "Czech",
|
|
|
|
"da": "Danish",
|
|
|
|
"dv": "Divehi; Maldivian;",
|
|
|
|
"nl": "Dutch",
|
|
|
|
"dz": "Dzongkha",
|
|
|
|
"en": "English",
|
|
|
|
"eo": "Esperanto",
|
|
|
|
"et": "Estonian",
|
|
|
|
"ee": "Ewe",
|
|
|
|
"fo": "Faroese",
|
|
|
|
"fj": "Fijian",
|
|
|
|
"fi": "Finnish",
|
|
|
|
"fr": "French",
|
|
|
|
"ff": "Fula",
|
|
|
|
"gl": "Galician",
|
|
|
|
"ka": "Georgian",
|
|
|
|
"de": "German",
|
|
|
|
"el": "Greek, Modern",
|
|
|
|
"gn": "Guaraní",
|
|
|
|
"gu": "Gujarati",
|
|
|
|
"ht": "Haitian",
|
|
|
|
"ha": "Hausa",
|
|
|
|
"he": "Hebrew (modern)",
|
|
|
|
"hz": "Herero",
|
|
|
|
"hi": "Hindi",
|
|
|
|
"ho": "Hiri Motu",
|
|
|
|
"hu": "Hungarian",
|
|
|
|
"ia": "Interlingua",
|
|
|
|
"id": "Indonesian",
|
|
|
|
"ie": "Interlingue",
|
|
|
|
"ga": "Irish",
|
|
|
|
"ig": "Igbo",
|
|
|
|
"ik": "Inupiaq",
|
|
|
|
"io": "Ido",
|
|
|
|
"is": "Icelandic",
|
|
|
|
"it": "Italian",
|
|
|
|
"iu": "Inuktitut",
|
|
|
|
"ja": "Japanese",
|
|
|
|
"jv": "Javanese",
|
|
|
|
"kl": "Kalaallisut",
|
|
|
|
"kn": "Kannada",
|
|
|
|
"kr": "Kanuri",
|
|
|
|
"ks": "Kashmiri",
|
|
|
|
"kk": "Kazakh",
|
|
|
|
"km": "Khmer",
|
|
|
|
"ki": "Kikuyu, Gikuyu",
|
|
|
|
"rw": "Kinyarwanda",
|
|
|
|
"ky": "Kirghiz, Kyrgyz",
|
|
|
|
"kv": "Komi",
|
|
|
|
"kg": "Kongo",
|
|
|
|
"ko": "Korean",
|
|
|
|
"ku": "Kurdish",
|
|
|
|
"kj": "Kwanyama, Kuanyama",
|
|
|
|
"la": "Latin",
|
|
|
|
"lb": "Luxembourgish",
|
|
|
|
"lg": "Luganda",
|
|
|
|
"li": "Limburgish",
|
|
|
|
"ln": "Lingala",
|
|
|
|
"lo": "Lao",
|
|
|
|
"lt": "Lithuanian",
|
|
|
|
"lu": "Luba-Katanga",
|
|
|
|
"lv": "Latvian",
|
|
|
|
"gv": "Manx",
|
|
|
|
"mk": "Macedonian",
|
|
|
|
"mg": "Malagasy",
|
|
|
|
"ms": "Malay",
|
|
|
|
"ml": "Malayalam",
|
|
|
|
"mt": "Maltese",
|
|
|
|
"mi": "Māori",
|
|
|
|
"mr": "Marathi (Marāṭhī)",
|
|
|
|
"mh": "Marshallese",
|
|
|
|
"mn": "Mongolian",
|
|
|
|
"na": "Nauru",
|
|
|
|
"nv": "Navajo, Navaho",
|
|
|
|
"nb": "Norwegian Bokmål",
|
|
|
|
"nd": "North Ndebele",
|
|
|
|
"ne": "Nepali",
|
|
|
|
"ng": "Ndonga",
|
|
|
|
"nn": "Norwegian Nynorsk",
|
|
|
|
"no": "Norwegian",
|
|
|
|
"ii": "Nuosu",
|
|
|
|
"nr": "South Ndebele",
|
|
|
|
"oc": "Occitan",
|
|
|
|
"oj": "Ojibwe, Ojibwa",
|
|
|
|
"cu": "Old Church Slavonic",
|
|
|
|
"om": "Oromo",
|
|
|
|
"or": "Oriya",
|
|
|
|
"os": "Ossetian, Ossetic",
|
|
|
|
"pa": "Panjabi, Punjabi",
|
|
|
|
"pi": "Pāli",
|
|
|
|
"fa": "Persian",
|
|
|
|
"pl": "Polish",
|
|
|
|
"ps": "Pashto, Pushto",
|
|
|
|
"pt": "Portuguese",
|
|
|
|
"qu": "Quechua",
|
|
|
|
"rm": "Romansh",
|
|
|
|
"rn": "Kirundi",
|
|
|
|
"ro": "Romanian, Moldavan",
|
|
|
|
"ru": "Russian",
|
|
|
|
"sa": "Sanskrit (Saṁskṛta)",
|
|
|
|
"sc": "Sardinian",
|
|
|
|
"sd": "Sindhi",
|
|
|
|
"se": "Northern Sami",
|
|
|
|
"sm": "Samoan",
|
|
|
|
"sg": "Sango",
|
|
|
|
"sr": "Serbian",
|
|
|
|
"gd": "Scottish Gaelic",
|
|
|
|
"sn": "Shona",
|
|
|
|
"si": "Sinhala, Sinhalese",
|
|
|
|
"sk": "Slovak",
|
|
|
|
"sl": "Slovene",
|
|
|
|
"so": "Somali",
|
|
|
|
"st": "Southern Sotho",
|
|
|
|
"es": "Spanish; Castilian",
|
|
|
|
"su": "Sundanese",
|
|
|
|
"sw": "Swahili",
|
|
|
|
"ss": "Swati",
|
|
|
|
"sv": "Swedish",
|
|
|
|
"ta": "Tamil",
|
|
|
|
"te": "Telugu",
|
|
|
|
"tg": "Tajik",
|
|
|
|
"th": "Thai",
|
|
|
|
"ti": "Tigrinya",
|
|
|
|
"bo": "Tibetan",
|
|
|
|
"tk": "Turkmen",
|
|
|
|
"tl": "Tagalog",
|
|
|
|
"tn": "Tswana",
|
|
|
|
"to": "Tonga",
|
|
|
|
"tr": "Turkish",
|
|
|
|
"ts": "Tsonga",
|
|
|
|
"tt": "Tatar",
|
|
|
|
"tw": "Twi",
|
|
|
|
"ty": "Tahitian",
|
|
|
|
"ug": "Uighur, Uyghur",
|
|
|
|
"uk": "Ukrainian",
|
|
|
|
"ur": "Urdu",
|
|
|
|
"uz": "Uzbek",
|
|
|
|
"ve": "Venda",
|
|
|
|
"vi": "Vietnamese",
|
|
|
|
"vo": "Volapük",
|
|
|
|
"wa": "Walloon",
|
|
|
|
"cy": "Welsh",
|
|
|
|
"wo": "Wolof",
|
|
|
|
"fy": "Western Frisian",
|
|
|
|
"xh": "Xhosa",
|
|
|
|
"yi": "Yiddish",
|
|
|
|
"yo": "Yoruba",
|
|
|
|
"za": "Zhuang, Chuang",
|
|
|
|
"zu": "Zulu",
|
2015-02-21 18:30:32 -08:00
|
|
|
}
|
2015-02-16 04:27:21 -08:00
|
|
|
|
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
countries = [
|
2020-07-06 16:11:15 -07:00
|
|
|
("AF", "Afghanistan"),
|
|
|
|
("AL", "Albania"),
|
|
|
|
("DZ", "Algeria"),
|
|
|
|
("AS", "American Samoa"),
|
|
|
|
("AD", "Andorra"),
|
|
|
|
("AO", "Angola"),
|
|
|
|
("AI", "Anguilla"),
|
|
|
|
("AQ", "Antarctica"),
|
|
|
|
("AG", "Antigua And Barbuda"),
|
|
|
|
("AR", "Argentina"),
|
|
|
|
("AM", "Armenia"),
|
|
|
|
("AW", "Aruba"),
|
|
|
|
("AU", "Australia"),
|
|
|
|
("AT", "Austria"),
|
|
|
|
("AZ", "Azerbaijan"),
|
|
|
|
("BS", "Bahamas"),
|
|
|
|
("BH", "Bahrain"),
|
|
|
|
("BD", "Bangladesh"),
|
|
|
|
("BB", "Barbados"),
|
|
|
|
("BY", "Belarus"),
|
|
|
|
("BE", "Belgium"),
|
|
|
|
("BZ", "Belize"),
|
|
|
|
("BJ", "Benin"),
|
|
|
|
("BM", "Bermuda"),
|
|
|
|
("BT", "Bhutan"),
|
|
|
|
("BO", "Bolivia"),
|
|
|
|
("BA", "Bosnia And Herzegowina"),
|
|
|
|
("BW", "Botswana"),
|
|
|
|
("BV", "Bouvet Island"),
|
|
|
|
("BR", "Brazil"),
|
|
|
|
("BN", "Brunei Darussalam"),
|
|
|
|
("BG", "Bulgaria"),
|
|
|
|
("BF", "Burkina Faso"),
|
|
|
|
("BI", "Burundi"),
|
|
|
|
("KH", "Cambodia"),
|
|
|
|
("CM", "Cameroon"),
|
|
|
|
("CA", "Canada"),
|
|
|
|
("CV", "Cape Verde"),
|
|
|
|
("KY", "Cayman Islands"),
|
|
|
|
("CF", "Central African Rep"),
|
|
|
|
("TD", "Chad"),
|
|
|
|
("CL", "Chile"),
|
|
|
|
("CN", "China"),
|
|
|
|
("CX", "Christmas Island"),
|
|
|
|
("CC", "Cocos Islands"),
|
|
|
|
("CO", "Colombia"),
|
|
|
|
("KM", "Comoros"),
|
|
|
|
("CG", "Congo"),
|
|
|
|
("CK", "Cook Islands"),
|
|
|
|
("CR", "Costa Rica"),
|
|
|
|
("CI", "Cote D`ivoire"),
|
|
|
|
("HR", "Croatia"),
|
|
|
|
("CU", "Cuba"),
|
|
|
|
("CY", "Cyprus"),
|
|
|
|
("CZ", "Czech Republic"),
|
|
|
|
("DK", "Denmark"),
|
|
|
|
("DJ", "Djibouti"),
|
|
|
|
("DM", "Dominica"),
|
|
|
|
("DO", "Dominican Republic"),
|
|
|
|
("TP", "East Timor"),
|
|
|
|
("EC", "Ecuador"),
|
|
|
|
("EG", "Egypt"),
|
|
|
|
("SV", "El Salvador"),
|
|
|
|
("GQ", "Equatorial Guinea"),
|
|
|
|
("ER", "Eritrea"),
|
|
|
|
("EE", "Estonia"),
|
|
|
|
("ET", "Ethiopia"),
|
|
|
|
("FK", "Falkland Islands (Malvinas)"),
|
|
|
|
("FO", "Faroe Islands"),
|
|
|
|
("FJ", "Fiji"),
|
|
|
|
("FI", "Finland"),
|
|
|
|
("FR", "France"),
|
|
|
|
("GF", "French Guiana"),
|
|
|
|
("PF", "French Polynesia"),
|
|
|
|
("TF", "French S. Territories"),
|
|
|
|
("GA", "Gabon"),
|
|
|
|
("GM", "Gambia"),
|
|
|
|
("GE", "Georgia"),
|
|
|
|
("DE", "Germany"),
|
|
|
|
("GH", "Ghana"),
|
|
|
|
("GI", "Gibraltar"),
|
|
|
|
("GR", "Greece"),
|
|
|
|
("GL", "Greenland"),
|
|
|
|
("GD", "Grenada"),
|
|
|
|
("GP", "Guadeloupe"),
|
|
|
|
("GU", "Guam"),
|
|
|
|
("GT", "Guatemala"),
|
|
|
|
("GN", "Guinea"),
|
|
|
|
("GW", "Guinea-bissau"),
|
|
|
|
("GY", "Guyana"),
|
|
|
|
("HT", "Haiti"),
|
|
|
|
("HN", "Honduras"),
|
|
|
|
("HK", "Hong Kong"),
|
|
|
|
("HU", "Hungary"),
|
|
|
|
("IS", "Iceland"),
|
|
|
|
("IN", "India"),
|
|
|
|
("ID", "Indonesia"),
|
|
|
|
("IR", "Iran"),
|
|
|
|
("IQ", "Iraq"),
|
|
|
|
("IE", "Ireland"),
|
|
|
|
("IL", "Israel"),
|
|
|
|
("IT", "Italy"),
|
|
|
|
("JM", "Jamaica"),
|
|
|
|
("JP", "Japan"),
|
|
|
|
("JO", "Jordan"),
|
|
|
|
("KZ", "Kazakhstan"),
|
|
|
|
("KE", "Kenya"),
|
|
|
|
("KI", "Kiribati"),
|
|
|
|
("KP", "Korea (North)"),
|
|
|
|
("KR", "Korea (South)"),
|
|
|
|
("KW", "Kuwait"),
|
|
|
|
("KG", "Kyrgyzstan"),
|
|
|
|
("LA", "Laos"),
|
|
|
|
("LV", "Latvia"),
|
|
|
|
("LB", "Lebanon"),
|
|
|
|
("LS", "Lesotho"),
|
|
|
|
("LR", "Liberia"),
|
|
|
|
("LY", "Libya"),
|
|
|
|
("LI", "Liechtenstein"),
|
|
|
|
("LT", "Lithuania"),
|
|
|
|
("LU", "Luxembourg"),
|
|
|
|
("MO", "Macau"),
|
|
|
|
("MK", "Macedonia"),
|
|
|
|
("MG", "Madagascar"),
|
|
|
|
("MW", "Malawi"),
|
|
|
|
("MY", "Malaysia"),
|
|
|
|
("MV", "Maldives"),
|
|
|
|
("ML", "Mali"),
|
|
|
|
("MT", "Malta"),
|
|
|
|
("MH", "Marshall Islands"),
|
|
|
|
("MQ", "Martinique"),
|
|
|
|
("MR", "Mauritania"),
|
|
|
|
("MU", "Mauritius"),
|
|
|
|
("YT", "Mayotte"),
|
|
|
|
("MX", "Mexico"),
|
|
|
|
("FM", "Micronesia"),
|
|
|
|
("MD", "Moldova"),
|
|
|
|
("MC", "Monaco"),
|
|
|
|
("MN", "Mongolia"),
|
|
|
|
("MS", "Montserrat"),
|
|
|
|
("MA", "Morocco"),
|
|
|
|
("MZ", "Mozambique"),
|
|
|
|
("MM", "Myanmar"),
|
|
|
|
("NA", "Namibia"),
|
|
|
|
("NR", "Nauru"),
|
|
|
|
("NP", "Nepal"),
|
|
|
|
("NL", "Netherlands"),
|
|
|
|
("AN", "Netherlands Antilles"),
|
|
|
|
("NC", "New Caledonia"),
|
|
|
|
("NZ", "New Zealand"),
|
|
|
|
("NI", "Nicaragua"),
|
|
|
|
("NE", "Niger"),
|
|
|
|
("NG", "Nigeria"),
|
|
|
|
("NU", "Niue"),
|
|
|
|
("NF", "Norfolk Island"),
|
|
|
|
("MP", "Northern Mariana Islands"),
|
|
|
|
("NO", "Norway"),
|
|
|
|
("OM", "Oman"),
|
|
|
|
("PK", "Pakistan"),
|
|
|
|
("PW", "Palau"),
|
|
|
|
("PA", "Panama"),
|
|
|
|
("PG", "Papua New Guinea"),
|
|
|
|
("PY", "Paraguay"),
|
|
|
|
("PE", "Peru"),
|
|
|
|
("PH", "Philippines"),
|
|
|
|
("PN", "Pitcairn"),
|
|
|
|
("PL", "Poland"),
|
|
|
|
("PT", "Portugal"),
|
|
|
|
("PR", "Puerto Rico"),
|
|
|
|
("QA", "Qatar"),
|
|
|
|
("RE", "Reunion"),
|
|
|
|
("RO", "Romania"),
|
|
|
|
("RU", "Russian Federation"),
|
|
|
|
("RW", "Rwanda"),
|
|
|
|
("KN", "Saint Kitts And Nevis"),
|
|
|
|
("LC", "Saint Lucia"),
|
|
|
|
("VC", "St Vincent/Grenadines"),
|
|
|
|
("WS", "Samoa"),
|
|
|
|
("SM", "San Marino"),
|
|
|
|
("ST", "Sao Tome"),
|
|
|
|
("SA", "Saudi Arabia"),
|
|
|
|
("SN", "Senegal"),
|
|
|
|
("SC", "Seychelles"),
|
|
|
|
("SL", "Sierra Leone"),
|
|
|
|
("SG", "Singapore"),
|
|
|
|
("SK", "Slovakia"),
|
|
|
|
("SI", "Slovenia"),
|
|
|
|
("SB", "Solomon Islands"),
|
|
|
|
("SO", "Somalia"),
|
|
|
|
("ZA", "South Africa"),
|
|
|
|
("ES", "Spain"),
|
|
|
|
("LK", "Sri Lanka"),
|
|
|
|
("SH", "St. Helena"),
|
|
|
|
("PM", "St.Pierre"),
|
|
|
|
("SD", "Sudan"),
|
|
|
|
("SR", "Suriname"),
|
|
|
|
("SZ", "Swaziland"),
|
|
|
|
("SE", "Sweden"),
|
|
|
|
("CH", "Switzerland"),
|
|
|
|
("SY", "Syrian Arab Republic"),
|
|
|
|
("TW", "Taiwan"),
|
|
|
|
("TJ", "Tajikistan"),
|
|
|
|
("TZ", "Tanzania"),
|
|
|
|
("TH", "Thailand"),
|
|
|
|
("TG", "Togo"),
|
|
|
|
("TK", "Tokelau"),
|
|
|
|
("TO", "Tonga"),
|
|
|
|
("TT", "Trinidad And Tobago"),
|
|
|
|
("TN", "Tunisia"),
|
|
|
|
("TR", "Turkey"),
|
|
|
|
("TM", "Turkmenistan"),
|
|
|
|
("TV", "Tuvalu"),
|
|
|
|
("UG", "Uganda"),
|
|
|
|
("UA", "Ukraine"),
|
|
|
|
("AE", "United Arab Emirates"),
|
|
|
|
("UK", "United Kingdom"),
|
|
|
|
("US", "United States"),
|
|
|
|
("UY", "Uruguay"),
|
|
|
|
("UZ", "Uzbekistan"),
|
|
|
|
("VU", "Vanuatu"),
|
|
|
|
("VA", "Vatican City State"),
|
|
|
|
("VE", "Venezuela"),
|
|
|
|
("VN", "Viet Nam"),
|
|
|
|
("VG", "Virgin Islands (British)"),
|
|
|
|
("VI", "Virgin Islands (U.S.)"),
|
|
|
|
("EH", "Western Sahara"),
|
|
|
|
("YE", "Yemen"),
|
|
|
|
("YU", "Yugoslavia"),
|
|
|
|
("ZR", "Zaire"),
|
|
|
|
("ZM", "Zambia"),
|
|
|
|
("ZW", "Zimbabwe"),
|
2015-02-21 18:30:32 -08:00
|
|
|
]
|
2015-02-16 04:27:21 -08:00
|
|
|
|
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
def getLanguageDict():
|
|
|
|
return lang_dict
|
|
|
|
|
2015-02-16 04:27:21 -08:00
|
|
|
|
2015-02-21 18:30:32 -08:00
|
|
|
def getLanguageFromISO(iso):
|
|
|
|
if iso is None:
|
|
|
|
return None
|
|
|
|
else:
|
|
|
|
return lang_dict[iso]
|
2019-09-10 14:34:09 -07:00
|
|
|
|
|
|
|
|
|
|
|
def getPublisher(publisher):
|
|
|
|
if publisher is None:
|
|
|
|
return ("", "")
|
|
|
|
imprint = ""
|
|
|
|
|
|
|
|
for pub in publishers:
|
|
|
|
imprint, publisher, ok = pub[publisher]
|
|
|
|
if ok:
|
|
|
|
break
|
|
|
|
|
|
|
|
return (imprint, publisher)
|
|
|
|
|
|
|
|
|
|
|
|
class ImprintDict(dict):
|
2020-07-06 16:11:15 -07:00
|
|
|
"""
|
2019-09-10 14:34:09 -07:00
|
|
|
ImprintDict takes a publisher and a dict or mapping of lowercased
|
|
|
|
imprint names to the proper imprint name. Retreiving a value from an
|
|
|
|
ImportDict returns a tuple of (imprint, publisher, keyExists).
|
|
|
|
if the key does not exist the key is returned as the publisher unchanged
|
2020-07-06 16:11:15 -07:00
|
|
|
"""
|
|
|
|
|
2019-09-10 14:34:09 -07:00
|
|
|
def __init__(self, publisher, mapping=(), **kwargs):
|
|
|
|
super().__init__(mapping, **kwargs)
|
|
|
|
self.publisher = publisher
|
|
|
|
|
|
|
|
def __missing__(self, key):
|
|
|
|
return None
|
|
|
|
|
|
|
|
def __getitem__(self, k):
|
|
|
|
item = super().__getitem__(k.lower())
|
|
|
|
if item is None:
|
|
|
|
return ("", k, False)
|
|
|
|
else:
|
|
|
|
return (item, self.publisher, True)
|
|
|
|
|
2020-07-06 16:11:15 -07:00
|
|
|
|
|
|
|
Marvel = ImprintDict(
|
|
|
|
"Marvel",
|
|
|
|
{
|
|
|
|
"marvel comics": "",
|
|
|
|
"marvel": "",
|
|
|
|
"aircel comics": "Aircel Comics",
|
|
|
|
"aircel": "Aircel Comics",
|
|
|
|
"atlas comics": "Atlas Comics",
|
|
|
|
"atlas": "Atlas Comics",
|
|
|
|
"crossgen comics": "CrossGen comics",
|
|
|
|
"crossgen": "CrossGen comics",
|
|
|
|
"curtis magazines": "Curtis Magazines",
|
|
|
|
"disney books group": "Disney Books Group",
|
|
|
|
"disney books": "Disney Books Group",
|
|
|
|
"disney kingdoms": "Disney Kingdoms",
|
|
|
|
"epic comics": "Epic Comics",
|
|
|
|
"epic": "Epic Comics",
|
|
|
|
"epic comics group": "Epic Comics",
|
|
|
|
"eternity comics": "Eternity Comics",
|
|
|
|
"humorama": "Humorama",
|
|
|
|
"icon comics": "Icon Comics",
|
|
|
|
"infinite comics": "Infinite Comics",
|
|
|
|
"malibu comics": "Malibu Comics",
|
|
|
|
"malibu": "Malibu Comics",
|
|
|
|
"marvel 2099": "Marvel 2099",
|
|
|
|
"marvel absurd": "Marvel Absurd",
|
|
|
|
"marvel adventures": "Marvel Adventures",
|
|
|
|
"marvel age": "Marvel Age",
|
|
|
|
"marvel books": "Marvel Books",
|
|
|
|
"marvel comics 2": "Marvel Comics 2",
|
|
|
|
"marvel edge": "Marvel Edge",
|
|
|
|
"marvel frontier": "Marvel Frontier",
|
|
|
|
"marvel illustrated": "Marvel Illustrated",
|
|
|
|
"marvel knights": "Marvel Knights",
|
|
|
|
"marvel digital comics unlimited": "Marvel Unlimited",
|
|
|
|
"marvel magazine group": "Marvel Magazine Group",
|
|
|
|
"marvel mangaverse": "Marvel Mangaverse",
|
|
|
|
"marvel monsters group": "Marvel Monsters Group",
|
|
|
|
"marvel music": "Marvel Music",
|
|
|
|
"marvel next": "Marvel Next",
|
|
|
|
"marvel noir": "Marvel Noir",
|
|
|
|
"marvel press": "Marvel Press",
|
|
|
|
"marvel uk": "Marvel UK",
|
|
|
|
"marvel unlimited": "Marvel Unlimited",
|
|
|
|
"max": "MAX",
|
|
|
|
"mc2": "Marvel Comics 2",
|
|
|
|
"new universe": "New Universe",
|
|
|
|
"non-pareil publishing corp.": "Non-Pareil Publishing Corp.",
|
|
|
|
"paramount comics": "Paramount Comics",
|
|
|
|
"power comics": "Power Comics",
|
|
|
|
"razorline": "Razorline",
|
|
|
|
"star comics": "Star Comics",
|
|
|
|
"timely comics": "Timely Comics",
|
|
|
|
"timely": "Timely Comics",
|
|
|
|
"tsunami": "Tsunami",
|
|
|
|
"ultimate comics": "Ultimate Comics",
|
|
|
|
"ultimate marvel": "Ultimate Marvel",
|
|
|
|
"vital publications, inc.": "Vital Publications, Inc.",
|
|
|
|
},
|
|
|
|
)
|
|
|
|
|
|
|
|
DC_Comics = ImprintDict(
|
|
|
|
"DC Comics",
|
|
|
|
{
|
|
|
|
"dc comics": "",
|
|
|
|
"dc_comics": "",
|
|
|
|
"dc": "",
|
|
|
|
"tangent comics": "Tangent Comics",
|
|
|
|
"dccomics": "",
|
|
|
|
"all star dc": "All-Star",
|
|
|
|
"all star": "All-Star",
|
|
|
|
"all-star dc": "All-Star",
|
|
|
|
"all-star": "All-Star",
|
|
|
|
"america's best comics": "America's Best Comics",
|
|
|
|
"black label": "DC Black Label",
|
|
|
|
"cliffhanger": "Cliffhanger",
|
|
|
|
"cmx manga": "CMX Manga",
|
|
|
|
"dc black label": "DC Black Label",
|
|
|
|
"dc focus": "DC Focus",
|
|
|
|
"dc ink": "DC Ink",
|
|
|
|
"dc zoom": "DC Zoom",
|
|
|
|
"earth m": "Earth M",
|
|
|
|
"earth one": "Earth One",
|
|
|
|
"earth-m": "Earth M",
|
|
|
|
"elseworlds": "Elseworlds",
|
|
|
|
"eo": "Earth One",
|
|
|
|
"first wave": "First Wave",
|
|
|
|
"focus": "DC Focus",
|
|
|
|
"helix": "Helix",
|
|
|
|
"homage comics": "Homage Comics",
|
|
|
|
"impact comics": "Impact Comics",
|
|
|
|
"impact! comics": "Impact Comics",
|
|
|
|
"!mpact comics": "Impact Comics",
|
|
|
|
"johnny dc": "Johnny DC",
|
|
|
|
"mad": "Mad",
|
|
|
|
"minx": "Minx",
|
|
|
|
"paradox press": "Paradox Press",
|
|
|
|
"piranha press": "Piranha Press",
|
|
|
|
"sandman universe": "Sandman Universe",
|
|
|
|
"tsr": "TSR",
|
|
|
|
"vertigo": "Vertigo",
|
|
|
|
"wildstorm productions": "WildStorm Productions",
|
|
|
|
"wildstorm signature": "WildStorm Productions",
|
|
|
|
"wildstorm": "WildStorm Productions",
|
|
|
|
"wonder comics": "Wonder Comics",
|
|
|
|
"young animal": "Young Animal",
|
|
|
|
"zuda comics": "Zuda Comics",
|
|
|
|
"zuda": "Zuda Comics",
|
|
|
|
},
|
|
|
|
)
|
|
|
|
|
|
|
|
Dark_Horse_Comics = ImprintDict(
|
|
|
|
"Dark Horse Comics",
|
|
|
|
{
|
|
|
|
"legend": "Legend",
|
|
|
|
"comics' greatest world": "Dark Horse Heroes",
|
|
|
|
"dark horse heroes": "Dark Horse Heroes",
|
|
|
|
"dark horse manga": "Dark Horse Manga",
|
|
|
|
"maverick": "Maverick",
|
|
|
|
"dh press": "DH Press",
|
|
|
|
"m press": "M Press",
|
|
|
|
"dark horse digital": "Dark Horse Digital",
|
|
|
|
"dh deluxe": "DH Deluxe",
|
|
|
|
"kitchen sink books": "Kitchen Sink Books",
|
|
|
|
"berger books": "Berger Books",
|
|
|
|
},
|
|
|
|
)
|
|
|
|
|
|
|
|
Archie_Comics = ImprintDict(
|
|
|
|
"Archie Comics",
|
|
|
|
{
|
|
|
|
"Archie Action": "Archie Action",
|
|
|
|
"Archie Horror": "Archie Horror",
|
|
|
|
"Dark Circle Comics": "Dark Circle Comics",
|
|
|
|
"Dark Circle": "Dark Circle Comics",
|
|
|
|
"Red Circle Comics": "Dark Circle Comics",
|
|
|
|
"Red Circle": "Dark Circle Comics",
|
|
|
|
"Archie Adventure Series": "Archie Adventure Series",
|
|
|
|
"Radio Comics": "Mighty Comics Group",
|
|
|
|
"Mighty Comics Group": "Mighty Comics Group",
|
|
|
|
},
|
|
|
|
)
|
2020-06-02 20:03:48 -07:00
|
|
|
publishers = [Marvel, DC_Comics, Dark_Horse_Comics, Archie_Comics]
|