From e486c5061088197b2964e09b7f144912cf8bb693 Mon Sep 17 00:00:00 2001
From: Mike J Innes
Date: Wed, 20 Jun 2018 14:44:16 +0100
Subject: [PATCH] fix data

---
 src/data/cmudict.jl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/data/cmudict.jl b/src/data/cmudict.jl
index 2a26b691..b3257734 100644
--- a/src/data/cmudict.jl
+++ b/src/data/cmudict.jl
@@ -40,7 +40,7 @@ function rawdict()
 filter(!isempty, split.(split(readstring(deps("cmudict", "cmudict")), "\n"))))
 end
 
-validword(s) = ismatch(r"^[\w\-\.]+$", s)
+validword(s) = isascii(s) && ismatch(r"^[\w\-\.]+$", s)
 
 cmudict() = filter((s, ps) -> validword(s), rawdict())
 