In [2]:
import re

In [3]:
# A plain literal pattern is case-sensitive, so the upper-case "ABC" is not reported.
re.compile("abc").findall("xyzabc..abc ABC ")


Out[3]:
['abc', 'abc']

In [5]:
# "+" is greedy: every run of consecutive "1" characters comes back as a single match.
[run.group() for run in re.finditer("1+", "11111111 1111")]


Out[5]:
['11111111', '1111']

In [6]:
# "ab+" needs one "a" followed by at least one "b"; a trailing lone "a" never matches.
re.findall(pattern="ab+", string="abababa , abb, aba  abababa abbbb ab ")


Out[6]:
['ab', 'ab', 'ab', 'abb', 'ab', 'ab', 'ab', 'ab', 'abbbb', 'ab']

In [7]:
# The class [123] stands for exactly one character, so "a123b" and "axb" are rejected.
re.compile("a[123]b").findall("a1b a2b, a3bss a123b   axb")


Out[7]:
['a1b', 'a2b', 'a3b']

In [10]:
# A leading "^" negates the class: the middle character must be something other than 1, 2 or 3.
[hit.group(0) for hit in re.finditer("a[^123]b", "a1b a2b, a3bss a123b   axb")]


Out[10]:
['axb']

In [11]:
# \d keeps its "single digit" meaning inside a character class.
re.findall(pattern=r'a[\d]b', string="a1b a2b, a3bss a123b   axb")


Out[11]:
['a1b', 'a2b', 'a3b']

In [12]:
# \d+ collects each maximal run of digits; the letters in between split the runs.
print(re.compile(r'\d+').findall('123xyz456'))


['123', '456']

In [16]:
# "*" permits zero digits, so a bare "xyz" matches as well as "123xyz".
print(re.findall(pattern=r'\d*xyz', string='123xyz xyz'))


['123xyz', 'xyz']

In [17]:
# "\?" is a literal question mark; the "?" after it makes that literal optional.
print([found.group() for found in re.finditer(r'\d+\??', '12?  12')])


['12?', '12']

In [20]:
# One or more digits immediately followed by the literal text "xyz".
print(re.compile(r'\d+xyz').findall('111xyz 123xyz'))


['111xyz', '123xyz']

In [23]:
# Greedy vs. lazy quantifier on the same input.
print(re.compile(r'\d+').findall("12345"))   # greedy: swallows the whole digit run
print(re.compile(r'\d+?').findall("12345"))  # lazy: stops after a single digit each time


['12345']
['1', '2', '3', '4', '5']

In [29]:
# A lazy {2,3}? must still grow to three digits when "xyz" has to follow it ...
print([m.group() for m in re.finditer(r'\d{2,3}?xyz', "123xyz")])
# ... but with nothing required afterwards it stops at the two-digit minimum.
print([m.group() for m in re.finditer(r'xyz\d{2,3}?', "xyz123")])


['123xyz']
['xyz12']

In [28]:
# The lazy first group takes only as much as the second group forces it to:
# (\d+) cannot start before the digits, so the first group expands to "abc" ...
print([m.groups() for m in re.finditer(r'(\w+?)(\d+)', 'abc123')])
# ... whereas (\w+) can start right after one character, leaving just "a" for the first group.
print([m.groups() for m in re.finditer(r'(\w+?)(\w+)', 'abc123')])


[('abc', '123')]
[('a', 'bc123')]

In [33]:
# Non-greedy match: ".+?" stops at the first "</div>", so each title is captured on its own.
print(re.compile(r'<div>(.+?)</div>').findall('<div>title1</div><div>title2</div>'))


['title1', 'title2']

In [37]:
# With the MULTILINE flag, "^" anchors at the start of every line, not only at the start of the string.
print(re.findall(r'^\w+', 'abc123\n12312312123', flags=re.M))


['abc123', '12312312123']

In [40]:
# With several groups each result is a tuple, ordered by opening parenthesis:
# (whole outer group, leading digits, run of "a"). An empty \d* yields ''.
print([m.groups() for m in re.finditer(r'((\d*)(a+))', '123a a')])


[('123a', '123', 'a'), ('a', '', 'a')]

In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]:


In [ ]: