develooper Front page | perl.perl5.changes | Postings from December 2002

Change 18266: Re: [perl #18107] lc(), uc() and ucfirst() broken inside utf8 regex

From:
hv
Date:
December 8, 2002 17:15
Subject:
Change 18266: Re: [perl #18107] lc(), uc() and ucfirst() broken inside utf8 regex
Message ID:
200212090115.gB91F6p09185@smtp3.ActiveState.com
Change 18266 by hv@hv-crypt.org on 2002/12/09 00:02:57

	Subject: Re: [perl #18107] lc(), uc() and ucfirst() broken inside utf8 regex
	From: Abhijit Menon-Sen <ams@wiw.org>
	Date: Wed, 6 Nov 2002 19:38:11 +0530
	Message-ID: <20021106193811.E20858@lustre.dyn.wiw.org>

Affected files ...

.... //depot/perl/regcomp.c#314 edit
.... //depot/perl/t/op/lc.t#11 edit

Differences ...

==== //depot/perl/regcomp.c#314 (text) ====
Index: perl/regcomp.c
--- perl/regcomp.c#313~18179~	Sun Nov 24 19:06:44 2002
+++ perl/regcomp.c	Sun Dec  8 16:02:57 2002
@@ -5065,6 +5065,23 @@
     SAVEVPTR(PL_reg_curpm);		/* from regexec.c */
     SAVEI32(PL_regnpar);		/* () count. */
     SAVEI32(PL_regsize);		/* from regexec.c */
+
+    {
+	/* Save $1..$n (#18107: UTF-8 s/(\w+)/uc($1)/e); AMS 20021106. */
+	int i;
+	GV *mgv;
+	REGEXP *rx;
+	char digits[16];
+
+	if (PL_curpm && (rx = PM_GETRE(PL_curpm))) {
+	    for (i = 1; i <= rx->nparens; i++) {
+		sprintf(digits, "%lu", i);
+		if ((mgv = gv_fetchpv(digits, FALSE, SVt_PV)))
+		    save_scalar(mgv);
+	    }
+	}
+    }
+
 #ifdef DEBUGGING
     SAVEPPTR(PL_reg_starttry);		/* from regexec.c */
 #endif

==== //depot/perl/t/op/lc.t#11 (text) ====
Index: perl/t/op/lc.t
--- perl/t/op/lc.t#10~14667~	Tue Feb 12 17:33:01 2002
+++ perl/t/op/lc.t	Sun Dec  8 16:02:57 2002
@@ -1,6 +1,6 @@
 #!./perl
 
-print "1..51\n";
+print "1..55\n";
 
 my $test = 1;
 
@@ -136,3 +136,18 @@
 ok(uc("\x{1C5}") eq "\x{1C4}",      "U+01C5 uc is U+01C4");
 ok(uc("\x{1C6}") eq "\x{1C4}",      "U+01C6 uc is U+01C4, too");
 
+# #18107: A host of bugs involving [ul]c{,first}. AMS 20021106
+$a = "\x{3c3}foo.bar"; # \x{3c3} == GREEK SMALL LETTER SIGMA.
+$b = "\x{3a3}FOO.BAR"; # \x{3a3} == GREEK CAPITAL LETTER SIGMA.
+
+($c = $b) =~ s/(\w+)/lc($1)/ge;
+ok($c eq $a, "Using s///e to change case.");
+
+($c = $a) =~ s/(\w+)/uc($1)/ge;
+ok($c eq $b, "Using s///e to change case.");
+
+($c = $b) =~ s/(\w+)/lcfirst($1)/ge;
+ok($c eq "\x{3c3}FOO.bAR", "Using s///e to change case.");
+
+($c = $a) =~ s/(\w+)/ucfirst($1)/ge;
+ok($c eq "\x{3a3}foo.Bar", "Using s///e to change case.");
End of Patch.




nntp.perl.org: Perl Programming lists via nntp and http.
Comments to Ask Bjørn Hansen at ask@perl.org | Group listing | About