forked from justmarkham/DAT4
-
Notifications
You must be signed in to change notification settings - Fork 0
/
03_re_example.py
46 lines (34 loc) · 1.47 KB
/
03_re_example.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
"""
This is an intro to regular expressions
I use https://regex101.com/#python to check my work!
"""
import re
# flow:
#   1. create a re pattern object
#   2. search (or match) it against text
#   3. organize the captured patterns into groups
#
# NOTE: every pattern below is a raw string (r"..."). In a plain string,
# "\d" / "\w" / "\." are invalid string escape sequences and newer Python
# versions warn about them; a raw string hands the backslash to the regex
# engine untouched.
#
# Each result is bound to a name so the values can be inspected (or
# printed) after running the script, instead of being thrown away.

# \d matches a single digit
text = "Hello! My name is Sinan. It is 2014 and it's amazing."
pattern1 = re.compile(r"\d")
first_digit_match = re.search(pattern1, text)  # a match object (None when nothing matches)

# use group(0) to get the full text of the match
# \d is just ONE digit, so it only finds the "2" in "2014"
first_digit = first_digit_match.group(0)  # == '2'

# adding a + means "at least one" but potentially more
pattern2 = re.compile(r"\d+")
year = re.search(pattern2, text).group(0)  # == '2014'

# use square brackets [] to match one of the items present
alphabet = 'abcdefg'
pattern3 = re.compile(r'[cfg]')
first_letter = re.search(pattern3, alphabet).group(0)  # == 'c', the first of c/f/g in the text

mystery_pattern = re.compile(r"\d+-\d+-\d+")
# take a few minutes, and discuss, what application could this mystery_pattern have
phone_number = re.search(mystery_pattern, "my phone number is 609-462-6706 dude").group(0)  # == '609-462-6706'

# . matches ANY character (except a newline, by default)
all_of_the_text = "dmzhvbekuhvbc dfljghwco87rc6geinsr6t4gi7rgwefiuvbekuhvbdfljghwco87rc6geinsr6t4gi7rgwefiu ywgsfybcstzvgbrtybte"
anything_pattern = re.compile(r".+")
everything = re.search(anything_pattern, all_of_the_text).group(0)  # == all_of_the_text

# \w matches any word character (letters, digits and underscore)
# if you want to match an actual period, do \.
email_pattern = re.compile(r"[\w\.]+@\w+\.com")
# The sample text must really contain an address: without an "@" in it,
# re.search returns None and .group(0) raises AttributeError.
email = re.search(email_pattern, "my email address is sinan@example.com").group(0)  # == 'sinan@example.com'