Skip to content

Commit

Permalink
Fix for issue Unstructured-IO#3815
Browse files Browse the repository at this point in the history
Removed redundant patch, as the fix is already merged upstream in pdfminer/pdfminer.six#885
  • Loading branch information
PhorstenkampFuzzy authored Dec 17, 2024
1 parent 9a9bf4c commit 19509ed
Show file tree
Hide file tree
Showing 3 changed files with 0 additions and 30 deletions.
6 changes: 0 additions & 6 deletions unstructured/partition/pdf.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,6 @@

import numpy as np
import wrapt
from pdfminer import psparser
from pdfminer.layout import LTContainer, LTImage, LTItem, LTTextBox
from pdfminer.utils import open_filename
from pi_heif import register_heif_opener
Expand Down Expand Up @@ -96,16 +95,11 @@
PartitionStrategy,
)
from unstructured.partition.utils.sorting import coord_has_valid_points, sort_page_elements
from unstructured.patches.pdfminer import parse_keyword
from unstructured.utils import first, requires_dependencies

if TYPE_CHECKING:
pass

# NOTE(alan): Patching this to fix a bug in pdfminer.six. Submitted this PR into pdfminer.six to fix
# the bug: https://github.com/pdfminer/pdfminer.six/pull/885
psparser.PSBaseParser._parse_keyword = parse_keyword # type: ignore

RE_MULTISPACE_INCLUDING_NEWLINES = re.compile(pattern=r"\s+", flags=re.DOTALL)


Expand Down
Empty file removed unstructured/patches/__init__.py
Empty file.
24 changes: 0 additions & 24 deletions unstructured/patches/pdfminer.py

This file was deleted.

0 comments on commit 19509ed

Please sign in to comment.