From a8ba1ddd78544b4bda749051d44f7b2a8a0ec5ff Mon Sep 17 00:00:00 2001
From: Jeremy Evans
Date: Fri, 24 Mar 2023 11:53:53 -0700
Subject: Use UTF-8 encoding for literal extended regexps with UTF-8 characters in comments

Fixes [Bug #19455]
---
 test/ruby/test_regexp.rb | 7 +++++++
 1 file changed, 7 insertions(+)
(limited to 'test')

diff --git a/test/ruby/test_regexp.rb b/test/ruby/test_regexp.rb
index f10d5f3077..d04b9cf766 100644
--- a/test/ruby/test_regexp.rb
+++ b/test/ruby/test_regexp.rb
@@ -187,6 +187,13 @@ class TestRegexp < Test::Unit::TestCase
     RUBY
   end
 
+  def test_utf8_comment_in_usascii_extended_regexp_bug_19455
+    assert_separately([], <<-RUBY)
+      assert_equal(Encoding::UTF_8, /(?#\u1000)/x.encoding)
+      assert_equal(Encoding::UTF_8, /#\u1000/x.encoding)
+    RUBY
+  end
+
   def test_union
     assert_equal :ok, begin
       Regexp.union(
-- 
cgit v1.2.1