df762746ec
for more information, see https://pre-commit.ci
131 lines
4.0 KiB
Python
131 lines
4.0 KiB
Python
"""Support for mixed digit/string type Issue field
|
|
|
|
Class for handling the odd permutations of an 'issue number' that the
|
|
comics industry throws at us.
|
|
e.g.: "12", "12.1", "0", "-1", "5AU", "100-2"
|
|
"""
|
|
|
|
# Copyright 2012-2014 ComicTagger Authors
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
from __future__ import annotations
|
|
|
|
import logging
|
|
import unicodedata
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
class IssueString:
    """Parse a comic "issue number" into a prefix, a numeric part and a suffix.

    The text is split into three attributes:

    * ``prefix`` -- leading alphabetic characters,
    * ``num``    -- the numeric portion as a float, or None if there is none,
    * ``suffix`` -- whatever follows the numeric portion.

    e.g.: "12", "12.1", "0", "-1", "5AU", "100-2"
    """

    def __init__(self, text: str | None) -> None:
        """Split *text* into ``prefix``, ``num`` and ``suffix``.

        ``None`` and the empty string leave ``num`` as None and both
        ``prefix`` and ``suffix`` empty. Any other value is converted with
        ``str()`` before parsing.
        """
        # break up the issue number string into 2 parts: the numeric and suffix string.
        # (assumes that the numeric portion is always first)
        self.num: float | None = None
        self.suffix = ""
        self.prefix = ""

        if text is None:
            return

        text = str(text)
        if not text:
            return

        # Locate the first non-alphabetic character; everything before it is the prefix.
        # NOTE: if every character is alphabetic the loop never breaks and idx stays on
        # the last character, so that character is passed to get_number() and ends up
        # in the suffix rather than the prefix. as_string() still round-trips the text.
        for idx, r in enumerate(text):
            if not r.isalpha():
                break
        self.prefix = text[:idx]
        self.num, self.suffix = self.get_number(text[idx:])

    def get_number(self, text: str) -> tuple[float | None, str]:
        """Split *text* into a leading number and the remaining suffix.

        An optional leading "-" or "+" is accepted, followed by digits with at
        most one ".". Returns ``(number, suffix)``; when no number can be read
        from the start of *text* the result is ``(None, text)``.
        """
        if not text:
            return None, ""

        # skip the sign if it's first
        start = 1 if text[0] in ("-", "+") else 0

        # A lone sign has nothing after it, and anything that does not continue with
        # a digit or "." is not numeric: the whole text is the suffix.
        if start >= len(text) or not (text[start].isdigit() or text[start] == "."):
            return None, text

        # walk through the string, look for split point (the first non-numeric)
        decimal_count = 0
        for idx in range(start, len(text)):
            if not (text[idx].isdigit() or text[idx] == "."):
                break
            # special case: also split on second "."
            if text[idx] == ".":
                decimal_count += 1
                if decimal_count > 1:
                    break
        else:
            idx = len(text)

        # move trailing numeric decimal to suffix
        # (only if there is other junk after)
        if text[idx - 1] == "." and len(text) != idx:
            idx -= 1

        # if there is no numeric after the sign, make the sign part of the suffix
        if idx == 1 and start == 1:
            idx = 0

        number_text = text[:idx]
        if not number_text:
            return None, text

        try:
            num = float(number_text)
        except ValueError:
            # e.g. ".", "-." or digit-like characters that float() rejects (such as
            # superscript digits): treat the whole text as a suffix instead of failing.
            return None, text
        return num, text[idx:]

    def as_string(self, pad: int = 0) -> str:
        """Return the number, left side zero-padded, with prefix and suffix attached.

        *pad* is the minimum number of digits for the whole-number part; the
        decimal part and the sign are not counted. If there is no numeric part
        the prefix and suffix are returned as-is.
        """
        # if there is no number return the text
        if self.num is None:
            return self.prefix + self.suffix

        # negative is added back in last
        negative = self.num < 0
        num_f = abs(self.num)

        # used for padding
        num_int = int(num_f)

        # whole numbers are rendered without a trailing ".0"
        if num_f.is_integer():
            num_s = str(num_int)
        else:
            num_s = str(num_f)

        # we only pad the whole number part, we don't care about the decimal
        length = len(str(num_int))
        padding = "0" * (pad - length) if length < pad else ""

        # add the padding to the front
        num_s = padding + num_s

        # finally add the negative back in
        if negative:
            num_s = "-" + num_s

        # return the prefix + formatted number + suffix
        return self.prefix + num_s + self.suffix

    def as_float(self) -> float | None:
        """Return the numeric part as a float, ignoring prefix and (most) suffixes.

        When the suffix is a single numeric character (e.g. a vulgar fraction
        such as "½") its numeric value is added to the number, with a missing
        number counted as 0. Otherwise ``num`` is returned unchanged, which may
        be None.
        """
        if len(self.suffix) == 1 and self.suffix.isnumeric():
            return (self.num or 0) + unicodedata.numeric(self.suffix)
        return self.num
|