Skip to content

Commit 9533683

Browse files
committed
fix: invalid imports
1 parent 4cc4b2a commit 9533683

2 files changed

Lines changed: 0 additions & 6 deletions

File tree

grobid_client/format/TEI2LossyJSON.py

Lines changed: 0 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -875,8 +875,6 @@ def get_refs_with_offsets(element):
875875
def _clean_text(text: str) -> str:
876876
if not text:
877877
return ""
878-
import re
879-
import html
880878
text = re.sub(r'\s+', ' ', text.strip())
881879
text = html.unescape(text)
882880
return text
@@ -961,8 +959,6 @@ def get_formatted_passage(head_paragraph, head_section, paragraph_id, element):
961959
def _clean_text_local(text: str) -> str:
962960
if not text:
963961
return ""
964-
import re
965-
import html
966962
text = re.sub(r'\s+', ' ', text.strip())
967963
text = html.unescape(text)
968964
return text

grobid_client/format/TEI2Markdown.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -648,8 +648,6 @@ def _extract_urls(self, bibl_struct: Tag, bib_data: dict) -> None:
648648

649649
def _extract_year(self, date_text: str) -> str:
650650
"""Extract year from date text, handling various formats."""
651-
import re
652-
653651
# Look for 4-digit year patterns
654652
year_match = re.search(r'\b(19|20)\d{2}\b', date_text)
655653
if year_match:

0 commit comments

Comments
 (0)