diff --git a/claudini/bench.py b/claudini/bench.py index ef245ff..d08ea68 100644 --- a/claudini/bench.py +++ b/claudini/bench.py @@ -47,7 +47,7 @@ class BenchmarkConfig: input_spec: InputSpec = field(default_factory=InputSpec.default) # Token filtering and final evaluation mode - filter_ascii: bool = True # block non-ASCII / non-printable tokens + filter_ascii: bool = False # block non-ASCII / non-printable tokens filter_special: bool = False # block special / control / added tokens filter_retok: bool = False # decode->re-encode retokenization round-trip filter final_input: str = "tokens" diff --git a/claudini/run_bench.py b/claudini/run_bench.py index d9b95ec..c85c24c 100644 --- a/claudini/run_bench.py +++ b/claudini/run_bench.py @@ -115,7 +115,7 @@ def run_bench( resolved_max_time = preset_cfg.get("max_time", None) # Token filtering - resolved_filter_ascii = preset_cfg.get("filter_ascii", True) + resolved_filter_ascii = preset_cfg.get("filter_ascii", False) resolved_filter_special = preset_cfg.get("filter_special", False) resolved_filter_retok = preset_cfg.get("filter_retok", False) resolved_final_input = preset_cfg.get("final_input", "tokens")