Regex Flashcards
Learn Regex syntax
import re
str = “The rain in Spain will rain.”
x = re.findall(“rain”, str)
print(x)
[‘rain’, ‘rain’]
import re
str = “The rain in Spain will rain.”
x = re.findall(“rain|Spain”, str)
print(x)
[‘rain’, ‘Spain’, ‘rain’]
import re
str = “The rain in Spain will rain.”
x = re.findall(“^rain|Spain”, str)
print(x)
[‘Spain’]
import re
print(re.findall(“al{2}”, “fall”))
print(re.findall(“al{3}”, “fall”))
print(re.findall(“tal{2}”, “fall”))
[‘all’]
[]
[]
import re
str = “alll aboard the pain train”
x = re.search(“aboard”, str)
print(x.span())
(5, 11)
import re
str = “alll aboard the pain train”
x = re.search(“aboard”, str)
print(x.string)
#.string returns the original string that was passed to re.search: alll aboard the pain train
import re
print(re.findall(“[arn]”, “rainy”))
print(re.findall(“[^arn]”, “rainy”))
print(re.findall(“^[arn]”, “rainy”))
[‘r’, ‘a’, ‘n’]
[‘i’, ‘y’]
[‘r’]
import re
str = “rainy”
x = re.findall(“[arn]”, str)
print(x)
[‘r’, ‘a’, ‘n’]
import re
str = “8 times before 11:45 AM”
x = re.findall(“[0-5][0-9]”, str)
print(x)
#Returns every two-digit sequence whose first digit is 0-5, i.e. 00 through 59: ['11', '45']
import re
str = “The rain in Spain”
x = re.findall(“\W”, str)
print(x)
#\W returns every non-word character (anything other than a letter, digit, or underscore), such as whitespace: [' ', ' ', ' ']
import re
str = “The rain in Spain”
x = re.findall(“\ASpain”, str)
print(x)
#\A matches only at the very start of the string; "Spain" is not at the start here, so the result is []
import re
print(re.findall("a...s$", "abs"))
print(re.findall("a...s$", "alias"))
print(re.findall("a...s$", "abyss"))
print(re.findall("a...s$", "abacus"))
#Each period matches any single character except a newline, so "a...s$" needs an a, exactly three characters, then an s at the end of the string: [] ['alias'] ['abyss'] []
import re
str = “a aabc daaaat”
x = re.findall(“a{2,3}”, str)
print(x)
#a{2,3} matches at least 2 and at most 3 consecutive a's: ['aa', 'aaa']
import re
print(re.findall("ma*n", "mn"))
print(re.findall("ma*n", "man"))
print(re.findall("ma*n", "maaan"))
print(re.findall("ma*n", "main"))
print(re.findall("ma*n", "woman"))
#* means zero or more occurrences of the preceding character (here, a): ['mn'] ['man'] ['maaan'] [] ['man']
import re
print(re.findall("ma+n", "mn"))
print(re.findall("ma+n", "man"))
print(re.findall("ma+n", "maaan"))
print(re.findall("ma+n", "main"))
print(re.findall("ma+n", "woman"))
#+ means one or more occurrences of the preceding character (here, a): [] ['man'] ['maaan'] [] ['man']
import re
print(re.findall("ma?n", "mn"))
print(re.findall("ma?n", "man"))
print(re.findall("ma?n", "maaan"))
print(re.findall("ma?n", "main"))
print(re.findall("ma?n", "woman"))
#? means zero or one occurrence of the preceding character (here, a): ['mn'] ['man'] [] [] ['man']
import re
print(re.findall(r”\bfoo”,”football”))
print(re.findall(r”\bfoo”,”a football”))
print(re.findall(r”\bfoo”,”afootball”))
\b is a word boundary, so \bfoo checks for foo at the beginning of a word
[‘foo’]
[‘foo’]
[]
import re
print(re.findall(r”foo\b”,”the foo”))
print(re.findall(r”foo\b”,”the afoo test”))
print(re.findall(r”foo\b”,”the afootest”))
\b is a word boundary, so foo\b checks for foo at the end of a word
[‘foo’]
[‘foo’]
[]
import re
print(re.findall(r”\Bfoo”,”football”))
print(re.findall(r”\Bfoo”,”a football”))
print(re.findall(r”\Bfoo”,”afootball”))
\B matches where there is no word boundary, so \Bfoo matches foo only when it is NOT at the beginning of a word
[]
[]
[‘foo’]
import re
print(re.findall(r”foo\B”,”the foo”))
print(re.findall(r”foo\B”,”the afoo test”))
print(re.findall(r”foo\B”,”the afootest”))
\B matches where there is no word boundary, so foo\B matches foo only when it is NOT at the end of a word
[]
[]
[‘foo’]
import re
print(re.findall(“\d”,”12a!bc3”))
print(re.findall(“\d”,”Pyth@n”))
\d makes a match for all digits
[‘1’, ‘2’, ‘3’]
[]
import re
print(re.findall(“\D”,”1a!b34’5”))
print(re.findall(“\D”,”1345”))
\D makes a match for all non-digits
[‘a’, ‘!’, ‘b’, “’”]
[]
import re
print(re.findall(“\s”,”Python”))
print(re.findall(“\s”,”Python yo”))
\s returns whitespace characters
[]
[' ']
import re
print(re.findall(“\S”,”a b”))
print(re.findall(“\s”,” “))
\S returns every character that isn't whitespace
#\s returns whitespace characters
['a', 'b']
[' ']
import re
print(re.findall(“\w”,”12&’: ;c”))
print(re.findall(“\w”,”’%> !”))
\w returns all word characters: letters, digits, and the underscore
[‘1’, ‘2’, ‘c’]
[]
import re
print(re.findall("\W", "1a2%c"))
print(re.findall("\W", "'%> !"))
\W returns all non-word characters (anything other than letters, digits, and the underscore)
['%']
["'", '%', '>', ' ', '!']
import re
print(re.findall(“Python\Z”,”I like Python”))
print(re.findall(“Python\Z”,”I like python”))
print(re.findall(“Python\Z”,”Python is fun”))
\Z matches only at the end of the string, so this returns 'Python' only when the string ends with "Python" (the match is case-sensitive)
[‘Python’]
[]
[]