In [1]:
import re
In [2]:
# Dot (.) stands for any single character other than a newline,
# so the "\n" separating the two words is the only character skipped.
pattern = r"."
match = re.compile(pattern).findall("Hello\nWorld")
print(match)
['H', 'e', 'l', 'l', 'o', 'W', 'o', 'r', 'l', 'd']
In [3]:
# Caret (^) anchors the pattern to the beginning of the string,
# so "Hello" is only reported because the text starts with it.
pattern = r"^Hello"
match = [found.group() for found in re.finditer(pattern, "Hello World")]
print(match)
['Hello']
In [4]:
# Dollar ($) anchors the pattern to the end of the string,
# so "World" is only reported because the text finishes with it.
pattern = r"World$"
match = re.compile(pattern).findall("Hello World")
print(match)
['World']
In [5]:
# Asterisk (*): zero or more repetitions of the preceding character.
# Zero repetitions is a valid match, so findall also reports the empty
# matches found just before "b" and at the very end of the string.
pattern = r"a*"
match = [found.group() for found in re.finditer(pattern, "aaaab")]
print(match)
['aaaa', '', '']
In [6]:
# Plus (+): one or more repetitions of the preceding character.
# Unlike "*", at least one "a" is required, so no empty matches appear.
pattern = r"a+"
match = re.compile(pattern).findall("aaaab")
print(match)
['aaaa']
In [7]:
# Question mark (?): zero or one repetition of the preceding character.
# Here the "b" after "a" is optional, so "abb" contributes only "ab".
pattern = r"ab?"
match = [found.group() for found in re.finditer(pattern, "a ab abb")]
print(match)
['a', 'ab', 'ab']
In [8]:
# Braces ({m,n}): between m and n repetitions of the preceding character.
# "a{2,3}" takes as many "a"s as it can (up to three), so "aaaa" yields
# "aaa" and the single leftover "a" is too short to match.
pattern = r"a{2,3}"
match = re.compile(pattern).findall("a aa aaa aaaa")
print(match)
['aa', 'aaa', 'aaa']
In [9]:
# Square brackets ([]): a character set that matches exactly one of the
# characters listed inside it; here, any single lowercase vowel.
pattern = r"[aeiou]"
match = [found.group() for found in re.finditer(pattern, "Hello World")]
print(match)
['e', 'o', 'o']
In [10]:
# Backslash (\): either escapes a special character or introduces a
# special sequence; "\d" is the special sequence for a single digit.
pattern = r"\d"
match = re.compile(pattern).findall("There are 2 apples")
print(match)
['2']
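\d: Matches any digit (equivalent to [0-9] for ASCII text).
\D: Matches any non-digit (equivalent to [^0-9] for ASCII text).
\w: Matches any word character: a letter, a digit, or an underscore (equivalent to [a-zA-Z0-9_] for ASCII text).
\W: Matches any non-word character (equivalent to [^a-zA-Z0-9_] for ASCII text).
\s: Matches any whitespace character (equivalent to [ \t\n\r\f\v] for ASCII text).
\S: Matches any non-whitespace character (equivalent to [^ \t\n\r\f\v] for ASCII text).
Note: for str patterns in Python 3 these classes are Unicode-aware by default (for example, \d also matches non-ASCII decimal digits); pass the re.ASCII flag to restrict them to exactly the ASCII sets shown above.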
In [11]:
import re
text = "The price is $123.45 on 2024-10-07."

# Dollar amount: a literal "$", one or more digits, a literal ".",
# then exactly two digits.
pattern = r"\$\d+\.\d{2}"
matches = [found.group() for found in re.finditer(pattern, text)]
print(matches)

# Date: four digits, two digits, and two digits separated by hyphens.
pattern = r"\d{4}-\d{2}-\d{2}"
matches = re.compile(pattern).findall(text)
print(matches)
['$123.45']
['2024-10-07']