Skip to content

Commit

Permalink
Allow caching of the UD/German-HDT dataset; increase pct precision
Browse files Browse the repository at this point in the history
  • Loading branch information
gremid committed Nov 26, 2024
1 parent f57d2cc commit 297dea2
Showing 1 changed file with 1 addition and 2 deletions.
3 changes: 1 addition & 2 deletions dwdsmor/build/benchmark.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,6 @@ def ud_de_hdt_tokens():
"universal_dependencies",
"de_hdt",
split="train",
- streaming=True,
trust_remote_code=True,
)
for s in sentences:
Expand Down Expand Up @@ -189,7 +188,7 @@ def compute_coverage(automata, limit=None, show_progress=False):
args = arg_parser.parse_args()

def pct(v):
- return "{:.2%}".format(v)
+ return "{:.3%}".format(v)

def count(v):
return "{:,d}".format(v)
Expand Down

0 comments on commit 297dea2

Please sign in to comment.