RustPython · youknowone · Apr 14, 2026 · Apr 12, 2026 · Apr 13, 2026 · ShaharNaveh
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/crates/vm/src/anystr.rs b/crates/vm/src/anystr.rs
@@ -4,6 +4,10 @@ use crate::{
     convert::TryFromBorrowedObject,
     function::OptionalOption,
 };
+use icu_properties::{
+    CodePointSetData,
+    props::{ChangesWhenLowercased, ChangesWhenUppercased, Lowercase, Uppercase},
+};
 use num_traits::{cast::ToPrimitive, sign::Signed};
 
 use core::ops::Range;
@@ -130,8 +134,6 @@ where
 }
 
 pub trait AnyChar: Copy {
-    fn is_lowercase(self) -> bool;
-    fn is_uppercase(self) -> bool;
     fn bytes_len(self) -> usize;
 }
 
@@ -407,12 +409,27 @@ pub trait AnyStr {
     //  _Py_bytes_islower
     //  unicode_islower_impl
+    /// Returns `true` when there is at least one lowercase character and no
+    /// uppercase or titlecase character, mirroring CPython's `unicode_islower_impl`.
+    ///
+    /// NOTE(review): every well-formed UTF-8 run of `as_bytes()` is decoded, so if
+    /// bytes objects also use this default, non-ASCII sequences are classified too,
+    /// unlike CPython's ASCII-only `_Py_bytes_islower` -- confirm against callers.
     fn py_islower(&self) -> bool {
+        // "Cased" evidence must be `Lowercase`: `Alphabetic` also matches caseless
+        // letters (CJK, Hebrew, ...), which would make such strings report `true`.
+        let lowercase = CodePointSetData::new::<Lowercase>();
+        // `Uppercase` rejects capitals even when they lack a lowercase mapping
+        // (e.g. mathematical capitals); `ChangesWhenLowercased` is kept so that
+        // titlecase letters, which lowercase to something else, are rejected too.
+        let uppercase = CodePointSetData::new::<Uppercase>();
+        let changes_when_lowercased = CodePointSetData::new::<ChangesWhenLowercased>();
         let mut lower = false;
-        for c in self.elements() {
-            if c.is_uppercase() {
+        // Ill-formed byte sequences are skipped; only valid UTF-8 text is examined.
+        for c in self.as_bytes().utf8_chunks().flat_map(|chunk| chunk.valid().chars()) {
+            if uppercase.contains(c) || changes_when_lowercased.contains(c) {
                 return false;
-            } else if !lower && c.is_lowercase() {
-                lower = true
+            } else if !lower && lowercase.contains(c) {
+                lower = true;
             }
         }
         lower
@@ -422,12 +439,27 @@ pub trait AnyStr {
     //   Py_bytes_isupper
     //  unicode_isupper_impl
+    /// Returns `true` when there is at least one uppercase character and no
+    /// lowercase or titlecase character, mirroring CPython's `unicode_isupper_impl`.
+    ///
+    /// NOTE(review): every well-formed UTF-8 run of `as_bytes()` is decoded, so if
+    /// bytes objects also use this default, non-ASCII sequences are classified too,
+    /// unlike CPython's ASCII-only `_Py_bytes_isupper` -- confirm against callers.
     fn py_isupper(&self) -> bool {
+        // "Cased" evidence must be `Uppercase`: `Alphabetic` also matches caseless
+        // letters (CJK, Hebrew, ...), which would make such strings report `true`.
+        let uppercase = CodePointSetData::new::<Uppercase>();
+        // `Lowercase` rejects small letters even when they lack an uppercase mapping
+        // (e.g. modifier letters such as U+02B0); `ChangesWhenUppercased` is kept so
+        // that titlecase letters, which uppercase to something else, are rejected too.
+        let lowercase = CodePointSetData::new::<Lowercase>();
+        let changes_when_uppercased = CodePointSetData::new::<ChangesWhenUppercased>();
         let mut upper = false;
-        for c in self.elements() {
-            if c.is_lowercase() {
+        // Ill-formed byte sequences are skipped; only valid UTF-8 text is examined.
+        for c in self.as_bytes().utf8_chunks().flat_map(|chunk| chunk.valid().chars()) {
+            if lowercase.contains(c) || changes_when_uppercased.contains(c) {
                 return false;
-            } else if !upper && c.is_uppercase() {
-                upper = true
+            } else if !upper && uppercase.contains(c) {
+                upper = true;
             }
         }
         upper

diff --git a/crates/vm/src/builtins/str.rs b/crates/vm/src/builtins/str.rs
@@ -2228,14 +2228,6 @@ impl AnyStrContainer<str> for String {
 }
 
 impl anystr::AnyChar for char {
-    fn is_lowercase(self) -> bool {
-        self.is_lowercase()
-    }
-
-    fn is_uppercase(self) -> bool {
-        self.is_uppercase()
-    }
-
     fn bytes_len(self) -> usize {
         self.len_utf8()
     }
@@ -2341,12 +2333,6 @@ impl AnyStrContainer<Wtf8> for Wtf8Buf {
 }
 
 impl anystr::AnyChar for CodePoint {
-    fn is_lowercase(self) -> bool {
-        self.is_char_and(char::is_lowercase)
-    }
-    fn is_uppercase(self) -> bool {
-        self.is_char_and(char::is_uppercase)
-    }
     fn bytes_len(self) -> usize {
         self.len_wtf8()
     }
@@ -2459,14 +2445,6 @@ impl AnyStrContainer<AsciiStr> for AsciiString {
 }
 
 impl anystr::AnyChar for ascii::AsciiChar {
-    fn is_lowercase(self) -> bool {
-        self.is_lowercase()
-    }
-
-    fn is_uppercase(self) -> bool {
-        self.is_uppercase()
-    }
-
     fn bytes_len(self) -> usize {
         1
     }

diff --git a/crates/vm/src/bytes_inner.rs b/crates/vm/src/bytes_inner.rs
@@ -1031,14 +1031,6 @@ impl AnyStrContainer<[u8]> for Vec<u8> {
 const ASCII_WHITESPACES: [u8; 6] = [0x20, 0x09, 0x0a, 0x0c, 0x0d, 0x0b];
 
 impl anystr::AnyChar for u8 {
-    fn is_lowercase(self) -> bool {
-        self.is_ascii_lowercase()
-    }
-
-    fn is_uppercase(self) -> bool {
-        self.is_ascii_uppercase()
-    }
-
     fn bytes_len(self) -> usize {
         1
     }

diff --git a/extra_tests/snippets/builtin_str.py b/extra_tests/snippets/builtin_str.py
@@ -69,6 +69,8 @@
 assert not a.isdecimal()
 assert not a.isnumeric()
 assert a.istitle()
+assert "\u1c89".istitle()
+# assert "Ǳ".title() == "ǲ"
 assert a.isalpha()
 
 s = "1 2 3"
@@ -220,6 +222,14 @@
 assert "abc\t12345\txyz".expandtabs() == "abc     12345   xyz"
 assert "-".join(["1", "2", "3"]) == "1-2-3"
 assert "HALLO".isupper()
+assert not "123".isupper()
+assert not "123".islower()
+assert not "\U0001f431".isupper()
+assert not "\U0001f431".islower()
+assert "\U0001f431 CAT".isupper()
+assert "\U0001f431 cat".islower()
+assert "\u0295".islower()
+assert "\u1c89".isupper()
 assert "hello, my name is".partition("my ") == ("hello, ", "my ", "name is")
 assert "hello".partition("is") == ("hello", "", "")
 assert "hello, my name is".rpartition("is") == ("hello, my name ", "is", "")
@@ -236,6 +246,8 @@
 assert not "123".isidentifier()
 
 assert "Σίσυφος".swapcase() == "σΊΣΥΦΟΣ"
+assert "\u0295".swapcase() == "\u0295"
+assert "\u1c89".swapcase() == "\u1c8a"
 
 # String Formatting
 assert "{} {}".format(1, 2) == "1 2"