Lib.test.test_re_jy.py Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of jython-standalone Show documentation
Show all versions of jython-standalone Show documentation
Jython is an implementation of the high-level, dynamic, object-oriented
language Python written in 100% Pure Java, and seamlessly integrated with
the Java platform. It thus allows you to run Python on any Java platform.
import re
import sys
import unittest
import test.test_support
import unicodedata
from unicodedata import category
class ReTest(unittest.TestCase):
def test_bug_1140_addendum(self):
result = re.sub('', lambda match : None, 'foo')
self.assertEqual(result, 'foo')
self.assert_(isinstance(result, str))
def test_sub_with_subclasses(self):
class Foo(unicode):
def join(self, items):
return Foo(unicode.join(self, items))
result = re.sub('bar', 'baz', Foo('bar'))
self.assertEqual(result, u'baz')
self.assertEqual(type(result), unicode)
class Foo2(unicode):
def join(self, items):
return Foo2(unicode.join(self, items))
def __getslice__(self, start, stop):
return Foo2(unicode.__getslice__(self, start, stop))
result = re.sub('bar', 'baz', Foo2('bar'))
self.assertEqual(result, Foo2('baz'))
self.assert_(isinstance(result, Foo2))
def test_unkown_groupname(self):
self.assertRaises(IndexError,
re.match(r'(?P\d+)\.(\d*)', '3.14').group,
'misspelled')
def test_whitespace(self):
# Test for http://bugs.jython.org/issue2226 - verify against cpython
ws_re = re.compile(r'\s')
not_ws_re = re.compile(r'\S')
cpython_ascii_whitespace = set(' \t\n\r\f\v')
for i in xrange(256):
c = chr(i)
if c in cpython_ascii_whitespace:
self.assertRegexpMatches(c, ws_re)
self.assertNotRegexpMatches(c, not_ws_re)
else:
self.assertNotRegexpMatches(c, ws_re)
self.assertRegexpMatches(c, not_ws_re)
def test_unicode_whitespace(self):
# Test for http://bugs.jython.org/issue2226
ws_re = re.compile(r'\s', re.UNICODE)
not_ws_re = re.compile(r'\S', re.UNICODE)
separator_categories = set(['Zl', 'Zp', 'Zs'])
separators = {chr(c) for c in [28, 29, 30, 31]}
special = set([
unicodedata.lookup('MONGOLIAN VOWEL SEPARATOR'),
u'\u0085', # NEXT LINE (NEL)
])
cpython_whitespace = set(' \t\n\r\f\v') | separators | special
for i in xrange(0xFFFF): # could test to sys.maxunicode, but does not appear to be necessary
if i >= 0xD800 and i <= 0xDFFF:
continue
c = unichr(i)
if c in cpython_whitespace or category(c) in separator_categories:
self.assertRegexpMatches(c, ws_re)
self.assertNotRegexpMatches(c, not_ws_re)
else:
self.assertNotRegexpMatches(c, ws_re)
self.assertRegexpMatches(c, not_ws_re)
def test_main():
test.test_support.run_unittest(ReTest)
if __name__ == "__main__":
test_main()