comictagger/comicapi/utils.py

"""Some generic utilities"""
# Copyright 2012-2014 ComicTagger Authors
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from __future__ import annotations

import json
import logging
import os
import pathlib
import platform
import unicodedata
from collections import defaultdict
from collections.abc import Iterable, Mapping
from shutil import which  # noqa: F401
from typing import Any

import comicapi.data
from comicapi import filenamelexer, filenameparser

try:
    import icu

    del icu
    icu_available = True
except ImportError:
    icu_available = False

logger = logging.getLogger(__name__)


def _custom_key(tup):
    """Sort key that ``os_sorted`` uses when it does not use natsort's OS key directly.

    The key is produced by ``natsort.os_sort_keygen()`` and then adjusted:
    every component of the form ``("", <int>, ...)`` has its leading empty
    string replaced by ``"a"``. All other components are kept unchanged.
    """
    import natsort

    def _patch(component):
        # NOTE(review): presumably this moves number-led chunks to where the
        # ICU-backed key would place them -- confirm against natsort's docs.
        starts_with_blank_then_int = (
            len(component) > 1
            and isinstance(component[1], int)
            and isinstance(component[0], str)
            and component[0] == ""
        )
        if starts_with_blank_then_int:
            return ("a", *component[1:])
        return component

    return tuple(_patch(component) for component in natsort.os_sort_keygen()(tup))


def os_sorted(lst: Iterable) -> Iterable:
    """Return the items of *lst* as a new sorted list, using a natsort OS-style key.

    natsort's own ``os_sort_keygen()`` key is used when PyICU could be
    imported or when running on Windows; otherwise ``_custom_key`` is used.
    """
    import natsort

    native_key_usable = icu_available or platform.system() == "Windows"
    sort_key = natsort.os_sort_keygen() if native_key_usable else _custom_key
    return sorted(lst, key=sort_key)


def parse_filename(
    filename: str,
    complicated_parser: bool = False,
    remove_c2c: bool = False,
    remove_fcbd: bool = False,
    remove_publisher: bool = False,
    split_words: bool = False,
    allow_issue_start_with_letter: bool = False,
    protofolius_issue_number_scheme: bool = False,
) -> filenameparser.FilenameInfo:
    """Parse a comic file name into a ``filenameparser.FilenameInfo``.

    Args:
        filename: Name to parse. An empty value yields a record whose fields
            are all empty strings (``annual``, ``c2c`` and ``fcbd`` are False).
        complicated_parser: Use ``filenamelexer.Lex`` + ``filenameparser.Parse``
            instead of ``filenameparser.FileNameParser``.
        remove_c2c: Forwarded to ``Parse`` (complicated parser only).
        remove_fcbd: Forwarded to ``Parse`` (complicated parser only).
        remove_publisher: Forwarded to ``Parse`` (complicated parser only).
        split_words: Run ``wordninja.split`` on the name (without its
            extension) and re-join the pieces with spaces before parsing.
        allow_issue_start_with_letter: Forwarded to ``Lex`` (complicated parser only).
        protofolius_issue_number_scheme: Forwarded to ``Parse`` (complicated parser only).

    Returns:
        The parsed information. With the simple parser only ``issue``,
        ``issue_count``, ``remainder``, ``series``, ``volume`` and ``year``
        are filled in; every other field is left blank.
    """
    if not filename:
        # Nothing to parse: return a fully populated but blank record.
        return filenameparser.FilenameInfo(
            alternate="",
            annual=False,
            archive="",
            c2c=False,
            fcbd=False,
            issue="",
            issue_count="",
            publisher="",
            remainder="",
            series="",
            title="",
            volume="",
            volume_count="",
            year="",
            format="",
        )

    if split_words:
        import wordninja

        stem, extension = os.path.splitext(filename)
        filename = " ".join(wordninja.split(stem)) + extension

    if not complicated_parser:
        simple = filenameparser.FileNameParser()
        simple.parse_filename(filename)
        return filenameparser.FilenameInfo(
            alternate="",
            annual=False,
            archive="",
            c2c=False,
            fcbd=False,
            issue=simple.issue,
            issue_count=simple.issue_count,
            publisher="",
            remainder=simple.remainder,
            series=simple.series,
            title="",
            volume=simple.volume,
            volume_count="",
            year=simple.year,
            format="",
        )

    lexer = filenamelexer.Lex(filename, allow_issue_start_with_letter)
    parsed = filenameparser.Parse(
        lexer.items,
        remove_c2c=remove_c2c,
        remove_fcbd=remove_fcbd,
        remove_publisher=remove_publisher,
        protofolius_issue_number_scheme=protofolius_issue_number_scheme,
    )
    return parsed.filename_info


def combine_notes(existing_notes: str | None, new_notes: str | None, split: str) -> str:
    """Merge *new_notes* into *existing_notes*, replacing anything after the last *split*.

    If *split* occurs in the existing notes, everything from its last
    occurrence onwards is discarded and *new_notes* is appended to what
    precedes it. Otherwise *new_notes* is added on a new line. ``None`` is
    treated as an empty string and the result is stripped of surrounding
    whitespace.
    """
    current = existing_notes or ""
    addition = new_notes or ""

    before, marker, after = current.rpartition(split)
    if not (before or marker):
        # Marker absent: rpartition leaves the whole text in the last slot.
        return f"{after}\n{addition}".strip()
    return (before + addition).strip()


def parse_date_str(date_str: str | None) -> tuple[int | None, int | None, int | None]:
    """Split a ``year-month-day`` style string into integers.

    The string is split on ``-``; the first three parts are converted with
    ``xlate_int`` and read as year, month and day. Missing parts (or an
    empty/``None`` input) give ``None``.

    Returns:
        ``(day, month, year)`` -- note the order is reversed from the input.
    """
    if not date_str:
        return None, None, None

    fields: list[int | None] = [xlate_int(part) for part in date_str.split("-")[:3]]
    # Pad so that year, month and day can always be unpacked.
    fields += [None] * (3 - len(fields))
    year, month, day = fields
    return day, month, year


def get_recursive_filelist(pathlist: list[str]) -> list[str]:
    """Expand *pathlist* into a flat list of file paths.

    Directories are walked recursively with ``os.walk`` and contribute every
    file found beneath them; any other existing path is added as given.
    Paths that do not exist are skipped.
    """
    collected: list[str] = []
    for entry in pathlist:
        if os.path.isdir(entry):
            collected.extend(
                os.path.join(dirpath, name) for dirpath, _, names in os.walk(entry) for name in names
            )
        elif os.path.exists(entry):
            collected.append(entry)

    return collected


def add_to_path(dirname: str) -> None:
    """Prepend *dirname* to this process's ``PATH`` unless it is already listed.

    *dirname* is made absolute and compared against the normalized entries
    of the current ``PATH``. When it is added, ``PATH`` is rewritten from the
    normalized entries with *dirname* first. An empty *dirname* is ignored.
    """
    if not dirname:
        return

    dirname = os.path.abspath(dirname)
    # PATH can be missing from the environment; ``split`` returns [] for None,
    # so a missing PATH is treated as empty instead of raising KeyError.
    paths = [os.path.normpath(x) for x in split(os.environ.get("PATH"), os.pathsep)]

    if dirname not in paths:
        paths.insert(0, dirname)
        os.environ["PATH"] = os.pathsep.join(paths)


def xlate_int(data: Any) -> int | None:
    """Convert *data* to an ``int`` via ``xlate_float``, or return ``None``.

    The value is first parsed by ``xlate_float`` and then truncated with
    ``int()``. ``None`` is returned when ``xlate_float`` cannot parse the
    value or when the parsed float is NaN or infinite.
    """
    number = xlate_float(data)
    if number is None:
        return None
    try:
        return int(number)
    except (ValueError, OverflowError):
        # int(nan) raises ValueError and int(inf) raises OverflowError;
        # report both as "not a number" like every other unparseable input.
        return None


def xlate_float(data: Any) -> float | None:
    """Convert *data* to a ``float``, or return ``None`` if that is not possible.

    Strings are stripped first. ``int``/``float`` values are converted
    directly. Anything else is turned into text and every character other
    than the digits ``0-9`` and ``.`` is discarded before conversion, so
    signs, letters and separators are ignored (``"-4"`` becomes ``4.0``).

    Returns:
        The parsed number, or ``None`` for ``None``, blank input, input with
        no digits or dots, or text that ``float()`` rejects (e.g. ``"1.2.3"``).
    """
    if isinstance(data, str):
        data = data.strip()
    if data is None or data == "":
        return None

    candidate: str | int | float
    if isinstance(data, (int, float)):
        candidate = data
    else:
        candidate = "".join(ch for ch in str(data) if ch in "1234567890.")
        if candidate == "":
            return None

    try:
        return float(candidate)
    except ValueError:
        return None


def xlate(data: Any) -> str | None:
    """Return *data* as a stripped string, or ``None`` for ``None`` and blank strings.

    Non-string values are converted with ``str()`` and stripped.
    """
    if data is None:
        return None
    if isinstance(data, str) and data.strip() == "":
        return None

    text = str(data)
    return text.strip()


def split(s: str | None, c: str) -> list[str]:
    """Split *s* on the separator *c*, returning the stripped, non-empty pieces.

    ``None`` or a blank string (as judged by ``xlate``) yields an empty list.
    """
    text = xlate(s)
    if not text:
        return []

    pieces = (piece.strip() for piece in text.strip().split(c))
    return [piece for piece in pieces if piece]


# Words dropped by remove_articles(); a frozenset gives O(1) membership tests.
_ARTICLES = frozenset(
    {
        "&",
        "a",
        "am",
        "an",
        "and",
        "as",
        "at",
        "be",
        "but",
        "by",
        "for",
        "if",
        "is",
        "issue",
        "it",
        "it's",
        "its",
        "itself",
        "of",
        "or",
        "so",
        "the",
        "with",
    }
)


def remove_articles(text: str) -> str:
    """Casefold *text* and drop common filler words from it.

    The text is casefolded, split on whitespace, and every word found in
    ``_ARTICLES`` is removed. The remaining words are joined with single
    spaces, so runs of whitespace collapse and the result has no leading
    or trailing space.
    """
    return " ".join(word for word in text.casefold().split() if word not in _ARTICLES)


def sanitize_title(text: str, basic: bool = False) -> str:
    """Normalize a title for comparison.

    The text is NFKD-normalized and casefolded, and apostrophes and double
    quotes are removed outright. Unless *basic* is true, the text is further
    reduced: punctuation becomes a space, only letters, separators and
    numbers are kept, and ``remove_articles`` is applied.

    Args:
        text: Title to normalize.
        basic: Stop after normalization, casefolding and quote removal.
    """
    # NFKD splits accented letters into base letter + combining mark.
    # Not every character decomposes to ASCII, e.g. "½" gives "1⁄2", not "1/2".
    text = unicodedata.normalize("NFKD", text).casefold()
    # Drop quotes without leaving a gap, so "it's" stays one word ("its").
    text = text.replace("'", "").replace('"', "")
    if basic:
        return text

    kept: list[str] = []
    for char in text:
        major_class = unicodedata.category(char)[0]
        if major_class == "P":
            # Punctuation separates words: "batman-superman" -> "batman superman".
            kept.append(" ")
        elif major_class in "LZN":
            kept.append(char)
        # Everything else (combining marks, symbols, controls, ...) is dropped.

    return remove_articles("".join(kept)).strip()


def titles_match(search_title: str, record_title: str, threshold: int = 90) -> bool:
    """Report whether two titles are similar enough to be considered a match.

    Both titles are passed through ``sanitize_title`` and compared with
    ``rapidfuzz.fuzz.ratio``; the score is truncated to an ``int``.

    Args:
        search_title: Title being searched for.
        record_title: Title of the candidate record.
        threshold: Minimum score for a match.

    Returns:
        ``True`` when the score is at least *threshold*.
    """
    import rapidfuzz.fuzz

    score = rapidfuzz.fuzz.ratio(sanitize_title(search_title), sanitize_title(record_title))
    ratio = int(score)
    # The unsanitized titles are logged.
    logger.debug(
        "search title: %s ; record title: %s ; ratio: %d ; match threshold: %d",
        search_title,
        record_title,
        ratio,
        threshold,
    )
    return ratio >= threshold


def unique_file(file_name: pathlib.Path) -> pathlib.Path:
    """Return a path based on *file_name* that does not exist yet.

    If *file_name* is free it is returned unchanged. Otherwise `` (1)``,
    `` (2)``, ... is appended to the original stem until a path is found
    that does not exist. Nothing is created on disk.
    """
    original_stem = file_name.stem
    attempt = 1
    while file_name.exists():
        file_name = file_name.with_stem(f"{original_stem} ({attempt})")
        attempt += 1
    return file_name


# Cache of language names keyed by their "alpha_2" index; filled on the first call to languages().
# A defaultdict is used so that looking up an unknown key yields None instead of raising KeyError.
_languages: dict[str | None, str | None] = defaultdict(lambda: None)

# Cache of country names keyed by their "alpha_2" index; filled on the first call to countries().
# Unknown keys yield None, as for _languages.
_countries: dict[str | None, str | None] = defaultdict(lambda: None)


def countries() -> dict[str | None, str | None]:
    """Return the shared mapping of country ``alpha_2`` key to country name.

    The mapping is filled from ``isocodes.countries.by_alpha_2`` the first
    time it is found empty. It is a ``defaultdict``, so looking up an
    unknown key gives ``None``.
    """
    if _countries:
        return _countries

    # Imported lazily so that isocodes is only loaded when first needed.
    import isocodes

    _countries.update((code, entry["name"]) for code, entry in isocodes.countries.by_alpha_2)
    return _countries


def languages() -> dict[str | None, str | None]:
    """Return the shared mapping of language ``alpha_2`` key to language name.

    The mapping is filled from ``isocodes.extendend_languages`` (indexed by
    ``alpha_2``) the first time it is found empty. It is a ``defaultdict``,
    so looking up an unknown key gives ``None``.
    """
    if _languages:
        return _languages

    # Imported lazily so that isocodes is only loaded when first needed.
    import isocodes

    # "extendend_languages" is the attribute name used here; do not "correct" it.
    by_alpha_2 = isocodes.extendend_languages._sorted_by_index(index="alpha_2")
    _languages.update((code, entry["name"]) for code, entry in by_alpha_2)
    return _languages


def get_language_from_iso(iso: str | None) -> str | None:
    """Return the language name stored under *iso* in ``languages()``, or ``None`` if unknown."""
    known_languages = languages()
    return known_languages[iso]


def get_language_iso(string: str | None) -> str | None:
    """Look up the ``alpha_2`` value for a language given by code or name.

    *string* is compared case-insensitively against the ``alpha_2``,
    ``alpha_3``, ``bibliographic``, ``common_name`` and ``name`` fields of
    each entry in ``isocodes.extendend_languages.items``.

    Returns:
        ``None`` when *string* is ``None``; the ``alpha_2`` value of the first
        matching entry (``None`` if that entry has no ``alpha_2`` key); or the
        casefolded *string* when nothing matches.
    """
    if string is None:
        return None
    import isocodes

    wanted = string.casefold()
    fields = ("alpha_2", "alpha_3", "bibliographic", "common_name", "name")

    for entry in isocodes.extendend_languages.items:
        matching_fields = [field for field in fields if field in entry and entry[field].casefold() == wanted]
        if matching_fields:
            return entry.get("alpha_2", None)

    # No entry matched: fall back to the casefolded input.
    return wanted


def get_country_from_iso(iso: str | None) -> str | None:
    """Return the country name stored under *iso* in ``countries()``, or ``None`` if unknown."""
    known_countries = countries()
    return known_countries[iso]


def get_publisher(publisher: str) -> tuple[str, str]:
    """Resolve *publisher* against the registered publishers and their imprints.

    Each ``ImprintDict`` in ``publishers`` is asked for *publisher* in turn;
    the first one that recognizes it decides the result.

    Returns:
        ``(imprint, publisher)``. The imprint is ``""`` when *publisher* is a
        publisher's own name or is not recognized at all; in the latter case
        *publisher* is returned unchanged.
    """
    for imprint_table in publishers.values():
        imprint, resolved_publisher, recognized = imprint_table[publisher]
        if recognized:
            return imprint, resolved_publisher

    return "", publisher


def update_publishers(new_publishers: Mapping[str, Mapping[str, str]]) -> None:
    """Merge *new_publishers* into the module-level ``publishers`` registry.

    Args:
        new_publishers: Maps a publisher name to a mapping of imprint key to
            imprint name. Imprints of an already registered publisher are
            merged into its existing ``ImprintDict``; a new publisher gets a
            new ``ImprintDict``.
    """
    for name, imprints in new_publishers.items():
        if name not in publishers:
            publishers[name] = ImprintDict(name, imprints)
            continue
        publishers[name].update(imprints)


class ImprintDict(dict):  # type: ignore
    """
    Mapping of casefolded imprint names to their proper names for one publisher.

    Indexing does not return the stored value directly: it returns a tuple
    ``(imprint, publisher, key_exists)``.

    * key equals the publisher's name (ignoring case): ``("", publisher, True)``
    * key is a known imprint (looked up casefolded): ``(imprint, publisher, True)``
    * anything else: ``("", key, False)`` -- the key is handed back unchanged
      in the publisher slot.

    Only ``[]`` lookups are customized; keys are casefolded on lookup, not on insert.
    """

    def __init__(self, publisher: str, mapping: tuple | Mapping = (), **kwargs: dict) -> None:  # type: ignore
        super().__init__(mapping, **kwargs)
        self.publisher = publisher

    def __missing__(self, key: str) -> None:
        # Lets the underlying dict lookup report "not found" as None instead of raising KeyError.
        return None

    def __getitem__(self, k: str) -> tuple[str, str, bool]:
        folded_key = k.casefold()
        if folded_key == self.publisher.casefold():
            # The key names the publisher itself, so there is no imprint.
            return "", self.publisher, True

        imprint = super().__getitem__(folded_key)
        if imprint is None:
            return "", k, False
        return imprint, self.publisher, True

    def copy(self) -> ImprintDict:
        """Return a shallow copy that keeps the publisher name."""
        raw_items = super().copy()
        return ImprintDict(self.publisher, raw_items)


# Registry of known publishers: publisher name -> ImprintDict of that publisher's imprints.
# Filled by update_publishers() (and therefore by load_publishers()); read by get_publisher().
publishers: dict[str, ImprintDict] = {}


def load_publishers() -> None:
    """Load ``publishers.json`` from ``comicapi.data.data_path`` into the publisher registry.

    The file is read as UTF-8 JSON and passed to ``update_publishers``.
    Any failure is logged with its traceback and otherwise ignored, so
    whatever was registered before the failure stays in place.
    """
    try:
        publishers_file = comicapi.data.data_path / "publishers.json"
        raw_json = publishers_file.read_text("utf-8")
        update_publishers(json.loads(raw_json))
    except Exception:
        logger.exception("Failed to load publishers.json; The are no publishers or imprints loaded")
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
+								"""Some generic utilities"""
-												Update copyright statements to ComicTagger Authors

											
										
										
											2023-02-16 17:23:13 -08:00
+								# Copyright 2012-2014 ComicTagger Authors
-												Apply pre-commit configuration

											
										
										
											2022-06-02 18:32:16 -07:00
+								#
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
+								# Licensed under the Apache License, Version 2.0 (the "License");
 								# you may not use this file except in compliance with the License.
 								# You may obtain a copy of the License at
-												Apply pre-commit configuration

											
										
										
											2022-06-02 18:32:16 -07:00
+								#
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
+								#     http://www.apache.org/licenses/LICENSE-2.0
-												Apply pre-commit configuration

											
										
										
											2022-06-02 18:32:16 -07:00
+								#
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
+								# Unless required by applicable law or agreed to in writing, software
 								# distributed under the License is distributed on an "AS IS" BASIS,
 								# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 								# See the License for the specific language governing permissions and
 								# limitations under the License.
-												Apply pre-commit configuration

											
										
										
											2022-06-02 18:32:16 -07:00
+								from __future__ import annotations
-												Squashed 'comicapi/' content from commit b7d2458

git-subtree-dir: comicapi
git-subtree-split: b7d2458b80467a47be1d1d58b31ffcac62c2743c

											
										
										
											2015-02-16 04:27:21 -08:00
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								import json
-												Add basic logging

											
										
										
											2022-04-04 18:59:26 -07:00
+								import logging
-												Squashed 'comicapi/' content from commit b7d2458

git-subtree-dir: comicapi
git-subtree-split: b7d2458b80467a47be1d1d58b31ffcac62c2743c

											
										
										
											2015-02-16 04:27:21 -08:00
+								import os
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								import pathlib
-												Make PyICU optional

Update README.md

											
										
										
											2023-04-22 22:00:26 -07:00
+								import platform
-												Improve issue identification

Move title sanitizing code to utils module
Update issue identifier to compare sanitized names

											
										
										
											2021-09-26 17:06:30 -07:00
+								import unicodedata
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comictaggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatibility with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
+								from collections import defaultdict
-												Make PyICU optional

Update README.md

											
										
										
											2023-04-22 22:00:26 -07:00
+								from collections.abc import Iterable, Mapping
-												fix rar test

											
										
										
											2022-06-06 16:58:27 -07:00
+								from shutil import which  # noqa: F401
-												Update dependencies

Includes changes from pyupgrade

											
										
										
											2022-08-10 16:46:00 -07:00
+								from typing import Any
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comictaggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatibility with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
-												Update PyInstaller usage

Switch to rapidfuzz from thefuzz
Add associations to macOS app bundle

											
										
										
											2022-10-25 21:48:01 -07:00
+								import comicapi.data
-												Implement support for protofolius's permission scheme

											
										
										
											2023-09-06 01:50:05 -07:00
+								from comicapi import filenamelexer, filenameparser
-												Squashed 'comicapi/' content from commit b7d2458

git-subtree-dir: comicapi
git-subtree-split: b7d2458b80467a47be1d1d58b31ffcac62c2743c

											
										
										
											2015-02-16 04:27:21 -08:00
-												Make PyICU optional

Update README.md

											
										
										
											2023-04-22 22:00:26 -07:00
+								try:
 								    import icu
 								    del icu
 								    icu_available = True
 								except ImportError:
 								    icu_available = False
-												Add basic logging

											
										
										
											2022-04-04 18:59:26 -07:00
+								logger = logging.getLogger(__name__)
-												Squashed 'comicapi/' content from commit b7d2458

git-subtree-dir: comicapi
git-subtree-split: b7d2458b80467a47be1d1d58b31ffcac62c2743c

											
										
										
											2015-02-16 04:27:21 -08:00
-												Make PyICU optional

Update README.md

											
										
										
											2023-04-22 22:00:26 -07:00
+								def _custom_key(tup):
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
+								    import natsort
-												Make PyICU optional

Update README.md

											
										
										
											2023-04-22 22:00:26 -07:00
+								    lst = []
 								    for x in natsort.os_sort_keygen()(tup):
 								        ret = x
 								        if len(x) > 1 and isinstance(x[1], int) and isinstance(x[0], str) and x[0] == "":
 								            ret = ("a", *x[1:])
 								        lst.append(ret)
 								    return tuple(lst)
 								def os_sorted(lst: Iterable) -> Iterable:
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
+								    import natsort
-												Make PyICU optional

Update README.md

											
										
										
											2023-04-22 22:00:26 -07:00
+								    key = _custom_key
 								    if icu_available or platform.system() == "Windows":
 								        key = natsort.os_sort_keygen()
 								    return sorted(lst, key=key)
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
-												Squashed 'comicapi/' content from commit b7d2458

git-subtree-dir: comicapi
git-subtree-split: b7d2458b80467a47be1d1d58b31ffcac62c2743c

											
										
										
											2015-02-16 04:27:21 -08:00
-												Implement support for protofolius's permission scheme

											
										
										
											2023-09-06 01:50:05 -07:00
+								def parse_filename(
 								    filename: str,
 								    complicated_parser: bool = False,
 								    remove_c2c: bool = False,
 								    remove_fcbd: bool = False,
 								    remove_publisher: bool = False,
 								    split_words: bool = False,
 								    allow_issue_start_with_letter: bool = False,
 								    protofolius_issue_number_scheme: bool = False,
 								) -> filenameparser.FilenameInfo:
-												Ensure FilenameInfo is always filled out fixes #556

											
										
										
											2023-10-23 21:08:55 -07:00
+								    if not filename:
 								        return filenameparser.FilenameInfo(
 								            alternate="",
 								            annual=False,
 								            archive="",
 								            c2c=False,
 								            fcbd=False,
 								            issue="",
 								            issue_count="",
 								            publisher="",
 								            remainder="",
 								            series="",
 								            title="",
 								            volume="",
 								            volume_count="",
 								            year="",
 								            format="",
 								        )
-												Implement support for protofolius's permission scheme

											
										
										
											2023-09-06 01:50:05 -07:00
+								    if split_words:
 								        import wordninja
 								        filename, ext = os.path.splitext(filename)
 								        filename = " ".join(wordninja.split(filename)) + ext
 								    if complicated_parser:
 								        lex = filenamelexer.Lex(filename, allow_issue_start_with_letter)
 								        p = filenameparser.Parse(
 								            lex.items,
 								            remove_c2c=remove_c2c,
 								            remove_fcbd=remove_fcbd,
 								            remove_publisher=remove_publisher,
 								            protofolius_issue_number_scheme=protofolius_issue_number_scheme,
 								        )
 								        return p.filename_info
 								    else:
 								        fnp = filenameparser.FileNameParser()
 								        fnp.parse_filename(filename)
-												Ensure FilenameInfo is always filled out fixes #556

											
										
										
											2023-10-23 21:08:55 -07:00
+								        fni = filenameparser.FilenameInfo(
 								            alternate="",
 								            annual=False,
 								            archive="",
 								            c2c=False,
 								            fcbd=False,
 								            issue=fnp.issue,
 								            issue_count=fnp.issue_count,
 								            publisher="",
 								            remainder=fnp.remainder,
 								            series=fnp.series,
 								            title="",
 								            volume=fnp.volume,
 								            volume_count="",
 								            year=fnp.year,
 								            format="",
 								        )
-												Implement support for protofolius's permission scheme

											
										
										
											2023-09-06 01:50:05 -07:00
+								        return fni
-												Append notes instead of overwriting them

Add issue_id to GenericMetadata

											
										
										
											2022-11-04 15:39:40 -07:00
+								def combine_notes(existing_notes: str | None, new_notes: str | None, split: str) -> str:
-												Fix issue with combine_notes

											
										
										
											2022-11-24 01:24:15 -08:00
+								    split_notes, split_str, untouched_notes = (existing_notes or "").rpartition(split)
 								    if split_notes or split_str:
-												Append notes instead of overwriting them

Add issue_id to GenericMetadata

											
										
										
											2022-11-04 15:39:40 -07:00
+								        return (split_notes + (new_notes or "")).strip()
 								    else:
 								        return (untouched_notes + "\n" + (new_notes or "")).strip()
-												Separate xlate into separate functions based on return type fixes #454

											
										
										
											2023-04-25 00:55:23 -07:00
+								def parse_date_str(date_str: str | None) -> tuple[int | None, int | None, int | None]:
-												Fix serializing of sets

											
										
										
											2022-07-25 11:22:44 -07:00
+								    day = None
 								    month = None
 								    year = None
 								    if date_str:
 								        parts = date_str.split("-")
-												Separate xlate into separate functions based on return type fixes #454

											
										
										
											2023-04-25 00:55:23 -07:00
+								        year = xlate_int(parts[0])
-												Fix serializing of sets

											
										
										
											2022-07-25 11:22:44 -07:00
+								        if len(parts) > 1:
-												Separate xlate into separate functions based on return type fixes #454

											
										
										
											2023-04-25 00:55:23 -07:00
+								            month = xlate_int(parts[1])
-												Fix serializing of sets

											
										
										
											2022-07-25 11:22:44 -07:00
+								            if len(parts) > 2:
-												Separate xlate into separate functions based on return type fixes #454

											
										
										
											2023-04-25 00:55:23 -07:00
+								                day = xlate_int(parts[2])
-												Fix serializing of sets

											
										
										
											2022-07-25 11:22:44 -07:00
+								    return day, month, year
-												Apply pre-commit configuration

											
										
										
											2022-06-02 18:32:16 -07:00
def get_recursive_filelist(pathlist: list[str]) -> list[str]:
    """Collect every file reachable from the entries of *pathlist*.

    Directories are walked recursively with ``os.walk`` and contribute the
    joined path of each file found beneath them. Any other entry is added
    unchanged when it exists and is dropped when it does not.
    """
    found: list[str] = []
    for entry in pathlist:
        if os.path.isdir(entry):
            found.extend(
                os.path.join(dirpath, name) for dirpath, _, names in os.walk(entry) for name in names
            )
            continue
        if os.path.exists(entry):
            found.append(entry)
    return found
-												Typed

											
										
										
											2022-05-17 13:57:04 -07:00
def add_to_path(dirname: str) -> None:
    """Prepend *dirname* to the process ``PATH`` unless it is already listed.

    An empty *dirname* is ignored. The directory is made absolute and the
    existing ``PATH`` entries are normalized before the comparison. ``PATH``
    is rewritten only when the directory is missing, in which case the new
    value is built from the normalized entries.

    An unset ``PATH`` variable is treated as an empty search path rather than
    raising ``KeyError``.
    """
    if not dirname:
        return
    dirname = os.path.abspath(dirname)
    # .get() returns None for an unset PATH, which split() turns into []
    paths = [os.path.normpath(x) for x in split(os.environ.get("PATH"), os.pathsep)]
    if dirname not in paths:
        paths.insert(0, dirname)
        os.environ["PATH"] = os.pathsep.join(paths)
-												Squashed 'comicapi/' content from commit b7d2458

git-subtree-dir: comicapi
git-subtree-split: b7d2458b80467a47be1d1d58b31ffcac62c2743c

											
										
										
											2015-02-16 04:27:21 -08:00
-												Separate xlate into separate functions based on return type fixes #454

											
										
										
											2023-04-25 00:55:23 -07:00
def xlate_int(data: Any) -> int | None:
    """Convert *data* to an ``int``, or return ``None`` when no number can be read.

    The value is parsed by ``xlate_float`` first and the result is truncated
    by ``int()``. Floats that have no integer representation (``inf`` and
    ``nan`` passed in directly) also yield ``None`` instead of raising.
    """
    number = xlate_float(data)
    if number is None:
        return None
    try:
        return int(number)
    except (OverflowError, ValueError):
        # int(float("inf")) raises OverflowError, int(float("nan")) raises ValueError
        return None
 								def xlate_float(data: Any) -> float | None:
-												Fix setting issue and alternate_number on GenericMetadata

IssueString.as_string always returns a string this is a problem for
  GenericMetadata. When the overlay function is used it checks
  specifically for the value None this allows the -m option to unset
  attributes however the issue attribute would get set to the empty
  string when loading ComicRack tags regardless of if there was a value
  stored in the file. Fixes #465 and #480

											
										
										
											2023-06-15 20:25:19 -07:00
+								    if isinstance(data, str):
 								        data = data.strip()
-												Separate xlate into separate functions based on return type fixes #454

											
										
										
											2023-04-25 00:55:23 -07:00
+								    if data is None or data == "":
 								        return None
 								    i: str | int | float
 								    if isinstance(data, (int, float)):
 								        i = data
 								    else:
 								        i = str(data).translate(defaultdict(lambda: None, zip((ord(c) for c in "1234567890."), "1234567890.")))
 								    if i == "":
 								        return None
 								    try:
 								        return float(i)
 								    except ValueError:
 								        return None
 								def xlate(data: Any) -> str | None:
-												Fix setting issue and alternate_number on GenericMetadata

IssueString.as_string always returns a string this is a problem for
  GenericMetadata. When the overlay function is used it checks
  specifically for the value None this allows the -m option to unset
  attributes however the issue attribute would get set to the empty
  string when loading ComicRack tags regardless of if there was a value
  stored in the file. Fixes #465 and #480

											
										
										
											2023-06-15 20:25:19 -07:00
+								    if data is None or isinstance(data, str) and data.strip() == "":
-												Cleanup metadata handling

Mainly corrects for consistency in most situations
CoMet is not touched as there is no support in the gui and has an odd requirements on attributes

											
										
										
											2021-08-07 21:54:29 -07:00
+								        return None
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comicataggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatiblity with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
-												Convert ComicIssue into GenericMetadata

I could not find a good reason for ComicIssue to exist other than that
 it had more attributes than GenericMetadata, so it has been replaced.
New attributes for GenericMetadata:
  series_id:        a string uniquely identifying the series to tag_origin
  series_aliases:   alternate series names that are not the canonical name
  title_aliases:    alternate issue titles that are not the canonical name
  alternate_images: a list of urls to alternate cover images

Updated attributes for GenericMetadata:
  genre        -> genres:        str -> list[str]
  comments     -> description:   str -> str
  story_arc    -> story_arcs:    str -> list[str]
  series_group -> series_groups: str -> list[str]
  character    -> characters:    str -> list[str]
  team         -> teams:         str -> list[str]
  location     -> locations:     str -> list[str]
  tag_origin   -> tag_origin:    str -> TagOrigin (tuple[str, str])

ComicSeries has been relocated to the ComicAPI package, currently has no
 usage within ComicAPI.
CreditMetadata has been renamed to Credit and has replaced Credit from
 ComicTalker.
fetch_series has been added to ComicTalker, this is currently only used
 in the GUI when a series is selected and does not already contain the
 needed fields, this function should always be cached.

A new split function has been added to ComicAPI, all uses of split on
 single characters have been updated to use this

cleanup_html and the corresponding setting are now only used in
 ComicTagger proper, for display we want any html directly from the
 upstream. When applying the metadata we then strip the description of
 any html.

A new conversion has been added to the MetadataFormatter:
  j: joins any lists into a string with ', '. Note this is a valid
     operation on strings as well, it will add ', ' in between every
     character.

parse_settings now assigns the given ComicTaggerPaths object to the
 result ensuring that the correct path is always used.

											
										
										
											2023-08-02 09:00:04 -07:00
+								    return str(data).strip()
 								def split(s: str | None, c: str) -> list[str]:
 								    s = xlate(s)
 								    if s:
 								        return [x.strip() for x in s.strip().split(c) if x.strip()]
 								    return []
-												Cleanup metadata handling

Mainly corrects for consistency in most situations
CoMet is not touched as there is no support in the gui and has an odd requirements on attributes

											
										
										
											2021-08-07 21:54:29 -07:00
-												Typed

											
										
										
											2022-05-17 13:57:04 -07:00
def remove_articles(text: str) -> str:
    """Return *text* casefolded with common filler words removed.

    The text is casefolded and split on whitespace. Every word that exactly
    matches an entry in the list below is dropped, and the remaining words are
    joined with single spaces. An input made up only of such words gives an
    empty string.
    """
    articles = frozenset(
        (
            "&",
            "a",
            "am",
            "an",
            "and",
            "as",
            "at",
            "be",
            "but",
            "by",
            "for",
            "if",
            "is",
            "issue",
            "it",
            "it's",
            "its",
            "itself",
            "of",
            "or",
            "so",
            "the",
            "with",
        )
    )
    return " ".join(word for word in text.casefold().split() if word not in articles)
-												Squashed 'comicapi/' content from commit b7d2458

git-subtree-dir: comicapi
git-subtree-split: b7d2458b80467a47be1d1d58b31ffcac62c2743c

											
										
										
											2015-02-16 04:27:21 -08:00
-												Add a literal search option

											
										
										
											2022-06-07 11:49:56 -07:00
def sanitize_title(text: str, basic: bool = False) -> str:
    """Normalize a title so that it can be compared or searched.

    The text is NFKD-normalized and casefolded, then apostrophes and double
    quotes are removed (comicvine keeps apostrophes a part of the word).

    With ``basic=True`` nothing else is done. Otherwise every punctuation
    character becomes a space, so that batman-superman stays two words. Only
    letters, separators and numbers are kept, which also drops the combining
    accents produced by the normalization. Finally ``remove_articles`` is
    applied and the result is stripped.
    """
    text = unicodedata.normalize("NFKD", text).casefold()
    text = text.replace("'", "").replace('"', "")
    if basic:
        return text

    kept = []
    for char in text:
        # first letter of the Unicode category: L(etter), N(umber), P(unctuation), Z (separator), ...
        major = unicodedata.category(char)[0]
        if major == "P":
            kept.append(" ")
        elif major in "LZN":
            kept.append(char)
    return remove_articles("".join(kept)).strip()
-												Fix issues

Refactor add_to_path with tests
Fix type hints for titles_match
Use casefold in get_language
Fix using the recursive flag in cli mode
Add http status code to ComicVine exceptions
Fix parenthesis getting removed when renaming
Add more tests

											
										
										
											2022-08-08 18:03:29 -07:00
def titles_match(search_title: str, record_title: str, threshold: int = 90) -> bool:
    """Report whether two titles are similar enough to count as a match.

    Both titles are run through ``sanitize_title`` and compared with
    ``rapidfuzz.fuzz.ratio``. The score is truncated to an int, logged at
    debug level together with the unsanitized titles, and compared against
    *threshold*. A score equal to the threshold is a match.
    """
    # imported here rather than at module level, so rapidfuzz is only loaded on the first call
    import rapidfuzz.fuzz

    cleaned_search = sanitize_title(search_title)
    cleaned_record = sanitize_title(record_title)
    ratio = int(rapidfuzz.fuzz.ratio(cleaned_search, cleaned_record))
    is_match = ratio >= threshold
    logger.debug(
        "search title: %s ; record title: %s ; ratio: %d ; match threshold: %d",
        search_title,
        record_title,
        ratio,
        threshold,
    )
    return is_match
-												Allow non-ascii in ComicVine searches

											
										
										
											2022-07-09 23:26:30 -07:00
-												Improve rename

Implement rename on ComicArchive
Simplify unique_file with pathlib
Fix issues during renaming and simplify with pathlib
Allow exporting as zip to export 7-zip archives

											
										
										
											2022-07-09 22:27:45 -07:00
+								def unique_file(file_name: pathlib.Path) -> pathlib.Path:
-												Fix renaming

Make ComicArchive.path always absolute
Fix unique_file not preserving the extension
Fix incorrect output when renaming in CLI mode
Fix handling of platform when renaming

											
										
										
											2022-08-19 20:20:37 -07:00
+								    name = file_name.stem
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
+								    counter = 1
 								    while True:
-												Improve rename

Implement rename on ComicArchive
Simplify unique_file with pathlib
Fix issues during renaming and simplify with pathlib
Allow exporting as zip to export 7-zip archives

											
										
										
											2022-07-09 22:27:45 -07:00
+								        if not file_name.exists():
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
+								            return file_name
-												Fix renaming

Make ComicArchive.path always absolute
Fix unique_file not preserving the extension
Fix incorrect output when renaming in CLI mode
Fix handling of platform when renaming

											
										
										
											2022-08-19 20:20:37 -07:00
+								        file_name = file_name.with_stem(name + " (" + str(counter) + ")")
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
+								        counter += 1
-												Squashed 'comicapi/' content from commit b7d2458

git-subtree-dir: comicapi
git-subtree-split: b7d2458b80467a47be1d1d58b31ffcac62c2743c

											
										
										
											2015-02-16 04:27:21 -08:00
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
+								_languages: dict[str | None, str | None] = defaultdict(lambda: None)
 								_countries: dict[str | None, str | None] = defaultdict(lambda: None)
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comicataggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatiblity with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
+								def countries() -> dict[str | None, str | None]:
 								    if not _countries:
-												Replace pycountry with isocodes

isocodes is updated more often and doesn't depend on deprecated packages

											
										
										
											2023-11-23 14:21:21 -08:00
+								        import isocodes
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comicataggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatiblity with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
-												Replace pycountry with isocodes

isocodes is updated more often and doesn't depend on deprecated packages

											
										
										
											2023-11-23 14:21:21 -08:00
+								        for alpha_2, c in isocodes.countries.by_alpha_2:
 								            _countries[alpha_2] = c["name"]
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
+								    return _countries
 								def languages() -> dict[str | None, str | None]:
 								    if not _languages:
-												Replace pycountry with isocodes

isocodes is updated more often and doesn't depend on deprecated packages

											
										
										
											2023-11-23 14:21:21 -08:00
+								        import isocodes
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
-												Replace pycountry with isocodes

isocodes is updated more often and doesn't depend on deprecated packages

											
										
										
											2023-11-23 14:21:21 -08:00
+								        for alpha_2, lng in isocodes.extendend_languages._sorted_by_index(index="alpha_2"):
 								            _languages[alpha_2] = lng["name"]
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
+								    return _languages
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comicataggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatiblity with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
-												Apply pre-commit configuration

											
										
										
											2022-06-02 18:32:16 -07:00
+								def get_language_from_iso(iso: str | None) -> str | None:
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
+								    return languages()[iso]
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comicataggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatiblity with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
-												Fix CBL tagging

											
										
										
											2022-10-02 19:33:12 -07:00
+								def get_language_iso(string: str | None) -> str | None:
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comicataggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatiblity with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
+								    if string is None:
-												Huge code cleanup

- `autopep8 -aa` for general cleanup;
- Changed order of imports, they should be ordered into 3 groups:
1. standard library imports;
2. 3rd party packages;
3. project imports.
- I commented various imports that were reported as unused by my IDE.
If everything goes fine we can consider to delete them;
- The Apache license disclaimers are now comments since triple-quotes
should be used only for docstrings;
- Fix - `utils.centerWindowOnParent` did not resolve, changed to
`centerWindowOnParent`

											
										
										
											2015-02-21 18:30:32 -08:00
+								        return None
-												Replace pycountry with isocodes

isocodes is updated more often and doesn't depend on deprecated packages

											
										
										
											2023-11-23 14:21:21 -08:00
+								    import isocodes
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
-												Remove attempted validation of language and country plus minor changes

											
										
										
											2023-05-24 17:32:52 -07:00
+								    # Return current string if all else fails
-												Fix CBL tagging

											
										
										
											2022-10-02 19:33:12 -07:00
+								    lang = string.casefold()
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comicataggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatiblity with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
-												Replace pycountry with isocodes

isocodes is updated more often and doesn't depend on deprecated packages

											
										
										
											2023-11-23 14:21:21 -08:00
+								    found = None
 								    for lng in isocodes.extendend_languages.items:
 								        for x in ("alpha_2", "alpha_3", "bibliographic", "common_name", "name"):
 								            if x in lng and lng[x].casefold() == lang:
 								                found = lng
 								        if found:
 								            break
 								    if found:
 								        return found.get("alpha_2", None)
-												Code cleanup

Remove no longer used google scripts
Remove convenience files from comicataggerlib and import comicapi directly
Add type-hints to facilitate auto-complete tools
Make PyQt5 code more compatible with PyQt6

Implement automatic tooling
isort and black for code formatting
Line length has been set to 120
flake8 for code standards with exceptions:
E203 - Whitespace before ':'  - format compatiblity with black
E501 - Line too long          - flake8 line limit cannot be set
E722 - Do not use bare except - fixing bare except statements is a
                                lot of overhead and there are already
                                many in the codebase

These changes, along with some manual fixes creates much more readable code.
See examples below:

diff --git a/comicapi/comet.py b/comicapi/comet.py
index d1741c5..52dc195 100644
--- a/comicapi/comet.py
+++ b/comicapi/comet.py
@@ -166,7 +166,2 @@ class CoMet:

-            if credit['role'].lower() in set(self.editor_synonyms):
-                ET.SubElement(
-                    root,
-                    'editor').text = "{0}".format(
-                    credit['person'])

@@ -174,2 +169,4 @@ class CoMet:
         self.indent(root)
+            if credit["role"].lower() in set(self.editor_synonyms):
+                ET.SubElement(root, "editor").text = str(credit["person"])

diff --git a/comictaggerlib/autotagmatchwindow.py b/comictaggerlib/autotagmatchwindow.py
index 4338176..9219f01 100644
--- a/comictaggerlib/autotagmatchwindow.py
+++ b/comictaggerlib/autotagmatchwindow.py
@@ -63,4 +63,3 @@ class AutoTagMatchWindow(QtWidgets.QDialog):
             self.skipButton, QtWidgets.QDialogButtonBox.ActionRole)
-        self.buttonBox.button(QtWidgets.QDialogButtonBox.Ok).setText(
-            "Accept and Write Tags")
+        self.buttonBox.button(QtWidgets.QDialogButtonBox.StandardButton.Ok).setText("Accept and Write Tags")

diff --git a/comictaggerlib/cli.py b/comictaggerlib/cli.py
index 688907d..dbd0c2e 100644
--- a/comictaggerlib/cli.py
+++ b/comictaggerlib/cli.py
@@ -293,7 +293,3 @@ def process_file_cli(filename, opts, settings, match_results):
                 if opts.raw:
-                    print((
-                        "{0}".format(
-                            str(
-                                ca.readRawCIX(),
-                                errors='ignore'))))
+                    print(ca.read_raw_cix())
                 else:

											
										
										
											2022-04-01 16:50:46 -07:00
+								    return lang
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
-												Add country functions to utils and try to convert a country name to ISO country name

											
										
										
											2023-05-22 16:02:56 -07:00
+								def get_country_from_iso(iso: str | None) -> str | None:
-												Reduce startup time

											
										
										
											2023-06-22 20:11:40 -07:00
+								    return countries()[iso]
-												Add country functions to utils and try to convert a country name to ISO country name

											
										
										
											2023-05-22 16:02:56 -07:00
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								def get_publisher(publisher: str) -> tuple[str, str]:
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
+								    imprint = ""
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								    for pub in publishers.values():
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
+								        imprint, publisher, ok = pub[publisher]
 								        if ok:
 								            break
-												Generate a namespace object for typing settngs

											
										
										
											2023-06-09 16:20:00 -07:00
+								    return imprint, publisher
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
-												Apply pre-commit configuration

											
										
										
											2022-06-02 18:32:16 -07:00
+								def update_publishers(new_publishers: Mapping[str, Mapping[str, str]]) -> None:
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								    for publisher in new_publishers:
 								        if publisher in publishers:
 								            publishers[publisher].update(new_publishers[publisher])
 								        else:
 								            publishers[publisher] = ImprintDict(publisher, new_publishers[publisher])
-												Update Settings

											
										
										
											2022-12-06 00:20:01 -08:00
+								class ImprintDict(dict):  # type: ignore
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								    """
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
+								    ImprintDict takes a publisher and a dict or mapping of lowercased
-												Fix small issues

Fix spelling errors
Remove Redundant exception types
Remove dead code
Change the forum link to point to GitHub discussions

											
										
										
											2022-06-07 20:22:33 -07:00
+								    imprint names to the proper imprint name. Retrieving a value from an
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
+								    ImprintDict returns a tuple of (imprint, publisher, keyExists).
 								    if the key does not exist the key is returned as the publisher unchanged
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								    """
-												Update Settings

											
										
										
											2022-12-06 00:20:01 -08:00
+								    def __init__(self, publisher: str, mapping: tuple | Mapping = (), **kwargs: dict) -> None:  # type: ignore
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
+								        super().__init__(mapping, **kwargs)
 								        self.publisher = publisher
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								    def __missing__(self, key: str) -> None:
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
+								        return None
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
+								    def __getitem__(self, k: str) -> tuple[str, str, bool]:
 								        item = super().__getitem__(k.casefold())
 								        if k.casefold() == self.publisher.casefold():
-												Generate a namespace object for typing settngs

											
										
										
											2023-06-09 16:20:00 -07:00
+								            return "", self.publisher, True
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
+								        if item is None:
-												Generate a namespace object for typing settngs

											
										
										
											2023-06-09 16:20:00 -07:00
+								            return "", k, False
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
+								        else:
-												Generate a namespace object for typing settngs

											
										
										
											2023-06-09 16:20:00 -07:00
+								            return item, self.publisher, True
-												Add publisher and imprint handling

Imprint handling has been added to utils and uses a subclassed dict to
return a tuple for imprint matching, this may not be the best idea but
it works for now.

Add settings option auto_imprint
Add cli flag -a, --auto-import

											
										
										
											2021-08-07 21:50:45 -07:00
-												Apply pre-commit configuration

											
										
										
											2022-06-02 18:32:16 -07:00
+								    def copy(self) -> ImprintDict:
-												Add tests

											
										
										
											2022-05-21 00:16:45 -07:00
+								        return ImprintDict(self.publisher, super().copy())
-												Merge branch 'AutoImprint' into develop

											
										
										
											2022-05-19 13:28:18 -07:00
 								publishers: dict[str, ImprintDict] = {}
 								def load_publishers() -> None:
-												Fix crash on startup

Add publishers.json to pip package
Add exception handling to prevent crash

											
										
										
											2022-05-19 20:13:59 -07:00
+								    try:
-												Update PyInstaller usage

Switch to rapidfuzz from thefuzz
Add associations to macOS app bundle

											
										
										
											2022-10-25 21:48:01 -07:00
+								        update_publishers(json.loads((comicapi.data.data_path / "publishers.json").read_text("utf-8")))
-												Fix crash on startup

Add publishers.json to pip package
Add exception handling to prevent crash

											
										
										
											2022-05-19 20:13:59 -07:00
+								    except Exception:
 								        logger.exception("Failed to load publishers.json; The are no publishers or imprints loaded")