diff --git a/src/basic/string.py b/src/basic/string.py index c69b706..eb5b4c1 100644 --- a/src/basic/string.py +++ b/src/basic/string.py @@ -38,6 +38,7 @@ def extract_alphanumeric(s: str) -> str: >>> extract_alphanumeric("こんにちは123ABCワールド") '123ABC' """ + # isalnum() alone would also accept non-ASCII alphanumeric characters (like full-width '１２３４５' or 'ＡＢＣＤＥ', or Japanese text such as 'こんにちは') # isascii() ensures we only get ASCII characters (0-127), # excluding Unicode characters like Japanese, Emoji, etc. return "".join(c for c in s if c.isascii() and c.isalnum())