diff --git a/provider/datagen/data/segmenter/grapheme.toml b/provider/datagen/data/segmenter/grapheme.toml index ea20e6ccfcd..6744e9b3e5a 100644 --- a/provider/datagen/data/segmenter/grapheme.toml +++ b/provider/datagen/data/segmenter/grapheme.toml @@ -2,8 +2,8 @@ # called LICENSE at the top level of the ICU4X source tree # (online at: https://github.com/unicode-org/icu4x/blob/main/LICENSE ). -# These grapheme boundary rules are based on UAX #29, Unicode Version 15.0.0. -# https://www.unicode.org/reports/tr29/tr29-41.html +# These grapheme boundary rules are based on UAX #29, Unicode Version 15.1.0. +# https://www.unicode.org/reports/tr29/tr29-43.html segmenter_type = "grapheme" diff --git a/provider/datagen/data/segmenter/sentence.toml b/provider/datagen/data/segmenter/sentence.toml index d04d2b2d548..28ab1696182 100644 --- a/provider/datagen/data/segmenter/sentence.toml +++ b/provider/datagen/data/segmenter/sentence.toml @@ -2,8 +2,8 @@ # called LICENSE at the top level of the ICU4X source tree # (online at: https://github.com/unicode-org/icu4x/blob/main/LICENSE ). -# These sentence boundary rules are based on UAX #29, Unicode Version 15.0.0. -# https://www.unicode.org/reports/tr29/tr29-41.html +# These sentence boundary rules are based on UAX #29, Unicode Version 15.1.0. +# https://www.unicode.org/reports/tr29/tr29-43.html segmenter_type = "sentence"