"""Regular-expression recipes, each validated against sample strings.

Every recipe binds three module-level names -- ``pattern``, ``str_true`` and
``str_false`` -- and then checks, via :func:`assert_matches`, that the
pattern matches all of ``str_true`` and none of ``str_false``.  Matching is
done with ``re.match``, i.e. anchored at the start of the string.

The code originates from a notebook.  The IPython-only magics are executed
only when an IPython shell is available, and the ``%timeit`` benchmarks are
reproduced with the standard-library ``timeit`` module.
"""

import re
import timeit


def assert_matches(pattern, str_true, str_false):
    """Check *pattern* against positive and negative sample strings.

    Args:
        pattern: Regular expression source (or compiled pattern).
        str_true: Iterable of strings that must match at their start.
        str_false: Iterable of strings that must not match.

    Raises:
        TypeError: If a sample collection is a bare string.  ``('abc')`` is
            a ``str``, not a tuple, and would be tested character by
            character.
        AssertionError: If a sample behaves contrary to expectation.
    """
    for name, samples in (('str_true', str_true), ('str_false', str_false)):
        if isinstance(samples, str):
            raise TypeError(
                '%s must be a collection of strings, not a bare string '
                '(missing trailing comma?)' % name
            )

    compiled = re.compile(pattern)
    for t in str_true:
        assert compiled.match(t), '%s is not True' % t
    for f in str_false:
        assert not compiled.match(f), '%s is not False' % f


# --- Environment report (IPython/Jupyter only) ------------------------------
try:
    # ``get_ipython`` exists only when running inside IPython/Jupyter.
    _shell = get_ipython()
except NameError:
    _shell = None

if _shell is not None:
    # Equivalent of the notebook magics:
    #   %load_ext watermark
    #   %watermark -d -v -u -t -z
    _shell.run_line_magic('load_ext', 'watermark')
    _shell.run_line_magic('watermark', '-d -v -u -t -z')


# --- Suffix check: plain Python vs. regular expressions ---------------------
needle = 'needlers'

# Python approach
print(bool(any([needle.endswith(e) for e in ('ly', 'ed', 'ing', 'ers')])))

# On-the-fly Regular expression in Python
print(bool(re.search(r'(?:ly|ed|ing|ers)$', needle)))

# Compiled Regular expression in Python
comp = re.compile(r'(?:ly|ed|ing|ers)$')
print(bool(comp.search(needle)))

# Statements timed below; they mirror the three approaches shown above.
_SUFFIX_BENCHMARKS = (
    "bool(any([needle.endswith(e) for e in ('ly', 'ed', 'ing', 'ers')]))",
    "bool(re.search(r'(?:ly|ed|ing|ers)$', needle))",
    "bool(comp.search(needle))",
)

# Stand-in for ``%timeit -n 10000 -r 50 <stmt>``.  Guarded so that merely
# importing this module does not spend time benchmarking.
if __name__ == '__main__':
    _loops, _runs = 10000, 50
    for _stmt in _SUFFIX_BENCHMARKS:
        _timings = timeit.repeat(
            _stmt, globals=globals(), number=_loops, repeat=_runs
        )
        print('%s\n    %d loops, best of %d: %.0f ns per loop'
              % (_stmt, _loops, _runs, min(_timings) / _loops * 1e9))


# --- File names with an image extension -------------------------------------
# remove `(?i)` to make regexpr case-sensitive
pattern = r'(?i)(\w+)\.(jpeg|jpg|png|gif|tif|svg)$'
str_true = ('test.gif', 'image.jpeg', 'image.jpg', 'image.TIF')
str_false = ('test.pdf', 'test.gif.pdf')
assert_matches(pattern, str_true, str_false)


# --- User names --------------------------------------------------------------
min_len = 5   # minimum length for a valid username
max_len = 15  # maximum length for a valid username

# remove `(?i)` to only allow lower-case letters
# The global flag must be the very first thing in the expression: Python
# 3.11+ raises re.error for `^(?i)...`.
pattern = r"(?i)^[a-z0-9_-]{%s,%s}$" % (min_len, max_len)
str_true = ('user123', '123_user', 'Username')
str_false = ('user', 'username1234_is-way-too-long', 'user$34354')
assert_matches(pattern, str_true, str_false)


# --- Email addresses ---------------------------------------------------------
pattern = r"(^[a-zA-Z0-9_.+-]+@[a-zA-Z0-9-]+\.[a-zA-Z0-9-.]+$)"
str_true = ('test@mail.com',)
str_false = ('testmail.com', '@testmail.com', 'test@mailcom')
assert_matches(pattern, str_true, str_false)


# --- URLs ---------------------------------------------------------------------
# NOTE(review): `([\/\w \.-]*)*` nests one quantifier inside another, which
# may backtrack heavily on long non-matching input -- confirm before using
# this on untrusted data.
pattern = r'^(https?:\/\/)?([\da-z\.-]+)\.([a-z\.]{2,6})([\/\w \.-]*)*\/?$'
str_true = (
    'https://github.com',
    'http://github.com',
    'www.github.com',
    'github.com',
    'test.de',
    'https://github.com/rasbt',
    'test.jpeg',  # !!! a plain file name is accepted as a URL as well
)
str_false = ('testmailcom', 'http:testmailcom')
assert_matches(pattern, str_true, str_false)


# --- Integers without sign ---------------------------------------------------
pattern = r'^\d+$'
str_true = ('123', '1')
str_false = ('abc', '1.1')
assert_matches(pattern, str_true, str_false)


# --- Negative integers -------------------------------------------------------
pattern = r'^-\d+$'
str_true = ('-123', '-1')
str_false = ('123', '-abc', '-1.1')
assert_matches(pattern, str_true, str_false)


# --- Integers with optional minus sign ---------------------------------------
pattern = r'^-{0,1}\d+$'
str_true = ('-123', '-1', '1', '123')
str_false = ('123.0', '-abc', '-1.1')
assert_matches(pattern, str_true, str_false)


# --- Numbers without sign (integer or decimal) --------------------------------
pattern = r'^\d*\.{0,1}\d+$'
str_true = ('1', '123', '1.234')
str_false = ('-abc', '-123', '-123.0')
assert_matches(pattern, str_true, str_false)


# --- Negative numbers (integer or decimal) -----------------------------------
pattern = r'^-\d*\.{0,1}\d+$'
str_true = ('-1', '-123', '-123.0')
str_false = ('-abc', '1', '123', '1.234')
assert_matches(pattern, str_true, str_false)


# --- Numbers with optional minus sign ----------------------------------------
pattern = r'^-{0,1}\d*\.{0,1}\d+$'
str_true = ('1', '123', '1.234', '-123', '-123.0')
# Trailing comma is essential: ('-abc') is a plain string and would be
# iterated character by character.
str_false = ('-abc',)
assert_matches(pattern, str_true, str_false)


# --- Dates, mm/dd/yyyy with years 1900-2099 ----------------------------------
pattern = r'^(0[1-9]|1[0-2])\/(0[1-9]|1\d|2\d|3[01])\/(19|20)\d{2}$'
str_true = ('01/08/2014', '12/30/2014')
str_false = ('22/08/2014', '-123', '1/8/2014', '1/08/2014', '01/8/2014')
assert_matches(pattern, str_true, str_false)


# --- Time, 12-hour clock with am/pm -------------------------------------------
# `(?i)` moved to the front of the expression (required since Python 3.11);
# it always applied to the whole pattern, so the behaviour is unchanged.
pattern = r'(?i)^(1[012]|[1-9]):[0-5][0-9](\s)?(am|pm)$'
str_true = ('2:00pm', '7:30 AM', '12:05 am')
str_false = ('22:00pm', '14:00', '3:12', '03:12pm')
assert_matches(pattern, str_true, str_false)


# --- Time, 24-hour clock ------------------------------------------------------
pattern = r'^([0-1]{1}[0-9]{1}|20|21|22|23):[0-5]{1}[0-9]{1}$'
str_true = ('14:00', '00:30')
str_false = ('22:00pm', '4:00')
assert_matches(pattern, str_true, str_false)


# --- HTML tags ----------------------------------------------------------------
# NOTE(review): in the received source everything between '<' and '>' had
# been stripped from this recipe (the pattern was cut down to
# `\s]+))?)+\s*|\s*)/?>` and the samples were empty strings).  The pattern
# head and the sample strings below are a reconstruction -- confirm them
# against the original notebook.
pattern = r"""</?\w+((\s+\w+(\s*=\s*(?:".*?"|'.*?'|[^'">\s]+))?)+\s*|\s*)/?>"""
str_true = ('<a>', '<a href="something">', '</a>', '<img src>')
str_false = ('a>', '<a ', '< a >')
assert_matches(pattern, str_true, str_false)


# --- IPv4 addresses -----------------------------------------------------------
# NOTE(review): the address-like samples were blanked out in the received
# source (only '17216.254.1' and '01 .102.103.104' survived); the others
# are reconstructed stand-ins -- confirm against the original notebook.
pattern = (r'^(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\.){3}'
           r'(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)$')
str_true = ('172.16.254.1', '1.2.3.4', '01.102.103.104')
str_false = ('17216.254.1', '1.2.3.4.5', '01 .102.103.104')
assert_matches(pattern, str_true, str_false)


# --- IPv6 addresses -----------------------------------------------------------
# One alternative per count of leading `hex:` groups (7 down to 0).  The
# adjacent literals concatenate to the original single-line expression.
pattern = (
    r'^\s*('
    r'(([0-9A-Fa-f]{1,4}:){7}([0-9A-Fa-f]{1,4}|:))'
    r'|(([0-9A-Fa-f]{1,4}:){6}(:[0-9A-Fa-f]{1,4}|((25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)(\.(25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)){3})|:))'
    r'|(([0-9A-Fa-f]{1,4}:){5}(((:[0-9A-Fa-f]{1,4}){1,2})|:((25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)(\.(25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)){3})|:))'
    r'|(([0-9A-Fa-f]{1,4}:){4}(((:[0-9A-Fa-f]{1,4}){1,3})|((:[0-9A-Fa-f]{1,4})?:((25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)(\.(25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)){3}))|:))'
    r'|(([0-9A-Fa-f]{1,4}:){3}(((:[0-9A-Fa-f]{1,4}){1,4})|((:[0-9A-Fa-f]{1,4}){0,2}:((25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)(\.(25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)){3}))|:))'
    r'|(([0-9A-Fa-f]{1,4}:){2}(((:[0-9A-Fa-f]{1,4}){1,5})|((:[0-9A-Fa-f]{1,4}){0,3}:((25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)(\.(25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)){3}))|:))'
    r'|(([0-9A-Fa-f]{1,4}:){1}(((:[0-9A-Fa-f]{1,4}){1,6})|((:[0-9A-Fa-f]{1,4}){0,4}:((25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)(\.(25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)){3}))|:))'
    r'|(:(((:[0-9A-Fa-f]{1,4}){1,7})|((:[0-9A-Fa-f]{1,4}){0,5}:((25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)(\.(25[0-5]|2[0-4]\d|1\d\d|[1-9]?\d)){3}))|:))'
    r')(%.+)?\s*$'
)
str_true = (
    '2001:470:9b36:1::2',
    '2001:cdba:0000:0000:0000:0000:3257:9652',
    '2001:cdba:0:0:0:0:3257:9652',
    '2001:cdba::3257:9652',
)
str_false = (
    '1200::AB00:1234::2552:7777:1313',          # uses `::` twice
    '1200:0000:AB00:1234:O000:2552:7777:1313',  # contains an O instead of 0
)
assert_matches(pattern, str_true, str_false)


# --- MAC addresses ------------------------------------------------------------
# `(?i)` moved to the front of the expression (required since Python 3.11).
pattern = r'(?i)^([0-9A-F]{2}[:-]){5}([0-9A-F]{2})$'
str_true = ('94-AE-70-A0-66-83', '58-f8-1a-00-44-c8', '00:A0:C9:14:C8:29')
str_false = ('0:00:00:00:00:00', '94-AE-70-A0 -66-83')
assert_matches(pattern, str_true, str_false)