Skip to content

Commit

Permalink
Fix pydantic validation error in de edition code
Browse files Browse the repository at this point in the history
The pages "verständigen" and "dece-septe" have incorrect wikitext, which
has since been fixed on de Wiktionary.
  • Loading branch information
xxyzz committed Mar 27, 2024
1 parent 8200ec3 commit 3a14dec
Show file tree
Hide file tree
Showing 2 changed files with 6 additions and 11 deletions.
2 changes: 1 addition & 1 deletion src/wiktextract/extractor/de/translation.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ def extract_translation(
)
else:
sense_translations = []
sense_id = level_node_child.template_parameters.get(1, "")
sense_id = str(level_node_child.template_parameters.get(1, ""))
base_translation_data = Translation(sense_id=sense_id)
if sense_id == "":
# XXX: Sense-disambiguate where senseids are in Ü-Liste (ca. 0.03% of pages), e.g.:
Expand Down
15 changes: 5 additions & 10 deletions tests/test_de_page.py
Original file line number Diff line number Diff line change
Expand Up @@ -10,17 +10,12 @@

class TestDEPage(unittest.TestCase):
def setUp(self):
conf1 = WiktionaryConfig(
dump_file_lang_code="de",
capture_language_codes=None,
capture_translations=True,
# capture_pronunciation=True,
# capture_linkages=True,
# capture_compounds=True,
# capture_redirects=True,
# capture_examples=True,
self.wxr = WiktextractContext(
Wtp(lang_code="de"),
WiktionaryConfig(
dump_file_lang_code="de", capture_language_codes=None
),
)
self.wxr = WiktextractContext(Wtp(lang_code="de"), conf1)
self.maxDiff = None

def tearDown(self) -> None:
Expand Down

0 comments on commit 3a14dec

Please sign in to comment.