Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Update Python 3.7 syntax to 3.8 #956

Merged
merged 5 commits into from
Jul 6, 2024
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 3 additions & 3 deletions pdfminer/converter.py
Original file line number Diff line number Diff line change
Expand Up @@ -458,7 +458,7 @@ def write_header(self) -> None:

def write_footer(self) -> None:
page_links = [
'<a href="#{}">{}</a>'.format(i, i) for i in range(1, self.pageno)
f'<a href="#{i}">{i}</a>' for i in range(1, self.pageno)
]
s = '<div style="position:absolute; top:0px;">Page: %s</div>\n' % ", ".join(
page_links
Expand Down Expand Up @@ -783,7 +783,7 @@ def render(item: LTItem) -> None:
)
self.write(s)
elif isinstance(item, LTFigure):
s = '<figure name="%s" bbox="%s">\n' % (item.name, bbox2str(item.bbox))
s = '<figure name="{}" bbox="{}">\n'.format(item.name, bbox2str(item.bbox))
pietermarsman marked this conversation as resolved.
Show resolved Hide resolved
self.write(s)
for child in item:
render(child)
Expand Down Expand Up @@ -974,7 +974,7 @@ def render(item: LTItem) -> None:
self.write("</div>\n")
elif isinstance(item, LTTextLine):
self.write(
"<span class='ocr_line' title='%s'>" % ((self.bbox_repr(item.bbox)))
"<span class='ocr_line' title='%s'>" % (self.bbox_repr(item.bbox))
)
for child_line in item:
render(child_line)
Expand Down
4 changes: 2 additions & 2 deletions pdfminer/fontmetrics.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,7 @@ def convert_font_metrics(path: str) -> None:
See below for the output.
"""
fonts = {}
with open(path, "r") as fileinput:
with open(path) as fileinput:
for line in fileinput.readlines():
f = line.strip().split(" ")
if not f:
Expand Down Expand Up @@ -66,7 +66,7 @@ def convert_font_metrics(path: str) -> None:
print("# -*- python -*-")
print("FONT_METRICS = {")
for (fontname, (props, chars)) in fonts.items():
print(" {!r}: {!r},".format(fontname, (props, chars)))
print(f" {fontname!r}: {(props, chars)!r},")
print("}")


Expand Down
2 changes: 1 addition & 1 deletion pdfminer/glyphlist.py
Original file line number Diff line number Diff line change
Expand Up @@ -58,7 +58,7 @@ def convert_glyphlist(path: str) -> None:
See output below.
"""
state = 0
with open(path, "r") as fileinput:
with open(path) as fileinput:
for line in fileinput.readlines():
line = line.strip()
if not line or line.startswith("#"):
Expand Down
16 changes: 8 additions & 8 deletions pdfminer/layout.py
Original file line number Diff line number Diff line change
Expand Up @@ -129,7 +129,7 @@ class LTText:
"""Interface for things that have text"""

def __repr__(self) -> str:
return "<%s %r>" % (self.__class__.__name__, self.get_text())
return "<{} {!r}>".format(self.__class__.__name__, self.get_text())

def get_text(self) -> str:
"""Text contained in this object"""
Expand All @@ -144,7 +144,7 @@ def __init__(self, bbox: Rect) -> None:
self.set_bbox(bbox)

def __repr__(self) -> str:
return "<%s %s>" % (self.__class__.__name__, bbox2str(self.bbox))
return "<{} {}>".format(self.__class__.__name__, bbox2str(self.bbox))

# Disable comparison.
def __lt__(self, _: object) -> bool:
Expand Down Expand Up @@ -330,7 +330,7 @@ def __init__(self, name: str, stream: PDFStream, bbox: Rect) -> None:
self.colorspace = [self.colorspace]

def __repr__(self) -> str:
return "<%s(%s) %s %r>" % (
return "<{}({}) {} {!r}>".format(
self.__class__.__name__,
self.name,
bbox2str(self.bbox),
Expand Down Expand Up @@ -410,7 +410,7 @@ def __init__(
return

def __repr__(self) -> str:
return "<%s %s matrix=%s font=%r adv=%s text=%r>" % (
return "<{} {} matrix={} font={!r} adv={} text={!r}>".format(
self.__class__.__name__,
bbox2str(self.bbox),
matrix2str(self.matrix),
Expand Down Expand Up @@ -503,7 +503,7 @@ def __init__(self, word_margin: float) -> None:
return

def __repr__(self) -> str:
return "<%s %s %r>" % (
return "<{} {} {!r}>".format(
self.__class__.__name__,
bbox2str(self.bbox),
self.get_text(),
Expand Down Expand Up @@ -674,7 +674,7 @@ def __init__(self) -> None:
return

def __repr__(self) -> str:
return "<%s(%s) %s %r>" % (
return "<{}({}) {} {!r}>".format(
self.__class__.__name__,
self.index,
bbox2str(self.bbox),
Expand Down Expand Up @@ -1007,7 +1007,7 @@ def __init__(self, name: str, bbox: Rect, matrix: Matrix) -> None:
return

def __repr__(self) -> str:
return "<%s(%s) %s matrix=%s>" % (
return "<{}({}) {} matrix={}>".format(
self.__class__.__name__,
self.name,
bbox2str(self.bbox),
Expand Down Expand Up @@ -1035,7 +1035,7 @@ def __init__(self, pageid: int, bbox: Rect, rotate: float = 0) -> None:
return

def __repr__(self) -> str:
return "<%s(%r) %s rotate=%r>" % (
return "<{}({!r}) {} rotate={!r}>".format(
self.__class__.__name__,
self.pageid,
bbox2str(self.bbox),
Expand Down
4 changes: 2 additions & 2 deletions pdfminer/pdfdevice.py
Original file line number Diff line number Diff line change
Expand Up @@ -292,11 +292,11 @@ def begin_tag(self, tag: PSLiteral, props: Optional["PDFStackT"] = None) -> None
if isinstance(props, dict):
s = "".join(
[
' {}="{}"'.format(utils.enc(k), utils.make_compat_str(v))
f' {utils.enc(k)}="{utils.make_compat_str(v)}"'
for (k, v) in sorted(props.items())
]
)
out_s = "<{}{}>".format(utils.enc(cast(str, tag.name)), s)
out_s = f"<{utils.enc(cast(str, tag.name))}{s}>"
self._write(out_s)
self._stack.append(tag)
return
Expand Down
6 changes: 3 additions & 3 deletions pdfminer/pdfdocument.py
Original file line number Diff line number Diff line change
Expand Up @@ -158,12 +158,12 @@ def load(self, parser: PDFParser) -> None:
break
f = line.split(b" ")
if len(f) != 2:
error_msg = "Trailer not found: {!r}: line={!r}".format(parser, line)
error_msg = f"Trailer not found: {parser!r}: line={line!r}"
raise PDFNoValidXRef(error_msg)
try:
(start, nobjs) = map(int, f)
except ValueError:
error_msg = "Invalid line: {!r}: line={!r}".format(parser, line)
error_msg = f"Invalid line: {parser!r}: line={line!r}"
raise PDFNoValidXRef(error_msg)
for objid in range(start, start + nobjs):
try:
Expand Down Expand Up @@ -833,7 +833,7 @@ def _getobj_parse(self, pos: int, objid: int) -> object:
objid1 = x[-2]
# #### end hack around malformed pdf files
if objid1 != objid:
raise PDFSyntaxError("objid mismatch: {!r}={!r}".format(objid1, objid))
raise PDFSyntaxError(f"objid mismatch: {objid1!r}={objid!r}")

if kwd != KWD(b"obj"):
raise PDFSyntaxError("Invalid object spec: offset=%r" % pos)
Expand Down
2 changes: 1 addition & 1 deletion pdfminer/pdffont.py
Original file line number Diff line number Diff line change
Expand Up @@ -1063,7 +1063,7 @@ def __init__(
cid_ordering = resolve1(self.cidsysteminfo.get("Ordering", b"unknown")).decode(
"latin1"
)
self.cidcoding = "{}-{}".format(cid_registry.strip(), cid_ordering.strip())
self.cidcoding = f"{cid_registry.strip()}-{cid_ordering.strip()}"
self.cmap: CMapBase = self.get_cmap_from_spec(spec, strict)

try:
Expand Down
2 changes: 1 addition & 1 deletion pdfminer/pdfinterp.py
Original file line number Diff line number Diff line change
Expand Up @@ -320,7 +320,7 @@ def do_keyword(self, pos: int, token: PSKeyword) -> None:
try:
(_, objs) = self.end_type("inline")
if len(objs) % 2 != 0:
error_msg = "Invalid dictionary construct: {!r}".format(objs)
error_msg = f"Invalid dictionary construct: {objs!r}"
raise PSTypeError(error_msg)
d = {literal_name(k): v for (k, v) in choplist(2, objs)}
(pos, data) = self.get_inline_data(pos + len(b"ID "))
Expand Down
29 changes: 12 additions & 17 deletions pdfminer/pdftypes.py
Original file line number Diff line number Diff line change
Expand Up @@ -44,25 +44,20 @@
LITERALS_JPX_DECODE = (LIT("JPXDecode"),)


if sys.version_info >= (3, 8):
from typing import Protocol
from typing import Protocol

class DecipherCallable(Protocol):
"""Fully typed a decipher callback, with optional parameter."""
class DecipherCallable(Protocol):
"""Fully typed a decipher callback, with optional parameter."""

def __call__(
self,
objid: int,
genno: int,
data: bytes,
attrs: Optional[Dict[str, Any]] = None,
) -> bytes:
raise NotImplementedError

else: # Fallback for older Python
from typing import Callable
def __call__(
self,
objid: int,
genno: int,
data: bytes,
attrs: Optional[Dict[str, Any]] = None,
) -> bytes:
raise NotImplementedError

DecipherCallable = Callable[..., bytes]


class PDFObject(PSObject):
Expand Down Expand Up @@ -333,7 +328,7 @@ def decode(self) -> None:

except zlib.error as e:
if settings.STRICT:
error_msg = "Invalid zlib bytes: {!r}, {!r}".format(e, data)
error_msg = f"Invalid zlib bytes: {e!r}, {data!r}"
raise PDFException(error_msg)

try:
Expand Down
4 changes: 2 additions & 2 deletions pdfminer/psparser.py
Original file line number Diff line number Diff line change
Expand Up @@ -132,7 +132,7 @@ def intern(self, name: PSLiteral.NameType) -> _SymbolT:
def literal_name(x: object) -> Any:
if not isinstance(x, PSLiteral):
if settings.STRICT:
raise PSTypeError("Literal required: {!r}".format(x))
raise PSTypeError(f"Literal required: {x!r}")
else:
name = x
else:
Expand Down Expand Up @@ -592,7 +592,7 @@ def start_type(self, pos: int, type: str) -> None:

def end_type(self, type: str) -> Tuple[int, List[PSStackType[ExtraT]]]:
if self.curtype != type:
raise PSTypeError("Type mismatch: {!r} != {!r}".format(self.curtype, type))
raise PSTypeError(f"Type mismatch: {self.curtype!r} != {type!r}")
objs = [obj for (_, obj) in self.curstack]
(pos, self.curtype, self.curstack) = self.context.pop()
log.debug("end_type: pos=%r, type=%r, objs=%r", pos, type, objs)
Expand Down
8 changes: 4 additions & 4 deletions pdfminer/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -39,7 +39,7 @@
AnyIO = Union[TextIO, BinaryIO]


class open_filename(object):
class open_filename:
"""
Context manager that allows opening a filename
(str or pathlib.PurePath type is supported) and closes it on exit,
Expand Down Expand Up @@ -89,7 +89,7 @@ def shorten_str(s: str, size: int) -> str:
return s[:size]
if len(s) > size:
length = (size - 5) // 2
return "{} ... {}".format(s[:length], s[-length:])
return f"{s[:length]} ... {s[-length:]}"
else:
return s

Expand Down Expand Up @@ -643,12 +643,12 @@ def enc(x: str) -> str:

def bbox2str(bbox: Rect) -> str:
(x0, y0, x1, y1) = bbox
return "{:.3f},{:.3f},{:.3f},{:.3f}".format(x0, y0, x1, y1)
return f"{x0:.3f},{y0:.3f},{x1:.3f},{y1:.3f}"


def matrix2str(m: Matrix) -> str:
(a, b, c, d, e, f) = m
return "[{:.2f},{:.2f},{:.2f},{:.2f}, ({:.2f},{:.2f})]".format(a, b, c, d, e, f)
return f"[{a:.2f},{b:.2f},{c:.2f},{d:.2f}, ({e:.2f},{f:.2f})]"


def vecBetweenBoxes(obj1: "LTComponent", obj2: "LTComponent") -> Point:
Expand Down
2 changes: 1 addition & 1 deletion setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
from setuptools import setup

root_dir = Path(__file__).parent
with open(root_dir / "README.md", "rt") as f:
with open(root_dir / "README.md") as f:
readme = f.read()

setup(
Expand Down
2 changes: 1 addition & 1 deletion tests/test_pdfdocument.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@
from tests.helpers import absolute_sample_path


class TestPdfDocument(object):
class TestPdfDocument:
def test_get_zero_objid_raises_pdfobjectnotfound(self):
with open(absolute_sample_path("simple1.pdf"), "rb") as in_file:
parser = PDFParser(in_file)
Expand Down
2 changes: 1 addition & 1 deletion tests/test_pdfpage.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@
from tests.helpers import absolute_sample_path


class TestPdfPage(object):
class TestPdfPage:
def test_page_labels(self):
path = absolute_sample_path("contrib/pagelabels.pdf")
expected_labels = ["iii", "iv", "1", "2", "1"]
Expand Down
4 changes: 2 additions & 2 deletions tests/test_tools_dumppdf.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,9 +11,9 @@ def run(filename, options=None):
absolute_path = absolute_sample_path(filename)
with TemporaryFilePath() as output_file_name:
if options:
s = "dumppdf -o %s %s %s" % (output_file_name, options, absolute_path)
s = "dumppdf -o {} {} {}".format(output_file_name, options, absolute_path)
else:
s = "dumppdf -o %s %s" % (output_file_name, absolute_path)
s = "dumppdf -o {} {}".format(output_file_name, absolute_path)

dumppdf.main(s.split(" ")[1:])

Expand Down
4 changes: 2 additions & 2 deletions tests/test_tools_pdf2txt.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,9 +12,9 @@ def run(sample_path, options=None):
absolute_path = absolute_sample_path(sample_path)
with TemporaryFilePath() as output_file_name:
if options:
s = "pdf2txt -o{} {} {}".format(output_file_name, options, absolute_path)
s = f"pdf2txt -o{output_file_name} {options} {absolute_path}"
else:
s = "pdf2txt -o{} {}".format(output_file_name, absolute_path)
s = f"pdf2txt -o{output_file_name} {absolute_path}"

pdf2txt.main(s.split(" ")[1:])

Expand Down
2 changes: 1 addition & 1 deletion tests/test_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -71,7 +71,7 @@ def given_plane_with_one_object(object_size=50, gridsize=50):
return plane, obj


class TestFunctions(object):
class TestFunctions:
def test_shorten_str(self):
s = shorten_str("Hello there World", 15)
assert s == "Hello ... World"
Expand Down
2 changes: 1 addition & 1 deletion tools/conv_afm.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,7 @@ def main(argv):
print("# -*- python -*-")
print("FONT_METRICS = {")
for (fontname, (props, chars)) in fonts.items():
print(" {!r}: {!r},".format(fontname, (props, chars)))
print(f" {fontname!r}: {(props, chars)!r},")
print("}")
return 0

Expand Down
6 changes: 3 additions & 3 deletions tools/dumppdf.py
Original file line number Diff line number Diff line change
Expand Up @@ -186,7 +186,7 @@ def resolve_dest(dest: object) -> Any:
dest = resolve_dest(action["D"])
pageno = pages[dest[0].objid]
s = escape(title)
outfp.write('<outline level="{!r}" title="{}">\n'.format(level, s))
outfp.write(f'<outline level="{level!r}" title="{s}">\n')
if dest is not None:
outfp.write("<dest>")
dumpxml(outfp, dest)
Expand Down Expand Up @@ -224,7 +224,7 @@ def extract1(objid: int, obj: Dict[str, Any]) -> None:
)
path = os.path.join(extractdir, "%.6d-%s" % (objid, filename))
if os.path.exists(path):
raise IOError("file exists: %r" % path)
raise OSError("file exists: %r" % path)
print("extracting: %r" % path)
os.makedirs(os.path.dirname(path), exist_ok=True)
out = open(path, "wb")
Expand Down Expand Up @@ -300,7 +300,7 @@ def create_parser() -> ArgumentParser:
"--version",
"-v",
action="version",
version="pdfminer.six v{}".format(pdfminer.__version__),
version=f"pdfminer.six v{pdfminer.__version__}",
)
parser.add_argument(
"--debug",
Expand Down
4 changes: 2 additions & 2 deletions tools/pdf2txt.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@ def float_or_disabled(x: str) -> Optional[float]:
try:
return float(x)
except ValueError:
raise argparse.ArgumentTypeError("invalid float value: {}".format(x))
raise argparse.ArgumentTypeError(f"invalid float value: {x}")


def extract_text(
Expand Down Expand Up @@ -77,7 +77,7 @@ def create_parser() -> argparse.ArgumentParser:
"--version",
"-v",
action="version",
version="pdfminer.six v{}".format(pdfminer.__version__),
version=f"pdfminer.six v{pdfminer.__version__}",
)
parser.add_argument(
"--debug",
Expand Down
Loading