Python正则表达式（上）开发者社区

Python正则表达式（上）

import re
# Read the text to validate; the prompt asks the user for a three-digit number.
input_number = input("请输入一个三位数:")
# A raw string hands "\d" to the regex engine untouched (in a plain literal
# "\d" is an invalid string escape that newer Python versions warn about).
# fullmatch succeeds only when the entire input is exactly three digits.
match = re.fullmatch(r"\d{3}", input_number)
if match is None:
    print("不符合要求")
else:
    print("符合要求")

# Step 1: compile the expression once into a reusable pattern object.
import re
pattern = re.compile(R"[1][345789]\d{9}")   # "1", one of 3/4/5/7/8/9, then nine digits
input_mobile = input("请输入手机号码:")
# Step 2: check the input against the compiled pattern.
# fullmatch is required here: match() only anchors at the start, so a valid
# 11-digit prefix followed by extra characters would be reported as valid.
if pattern.fullmatch(input_mobile):
    print("输入的手机号有效！")
else:
    print("输入的手机号无效！")

.   \   |   ^   $   *   +   ?   []   {}   ()

# "^a..." needs an "a" at the start of the string followed by three more
# characters. NOTE: the results of the two match calls below are not printed
# or stored, so they are only visible in an interactive session.
re.compile("^a...").match("avfs")

# ".{3}" repeats the wildcard three times, the same requirement as "...".
re.compile("^a.{3}").match("avfs")

# The leading "^" anchor is dropped here, so findall collects every
# non-overlapping "a" + three characters anywhere in the string.
print(re.compile("a.{3}").findall("avfssssadddadddaef"))

['avfs', 'addd', 'addd']

import re
# \D = one non-digit, \s{2} = exactly two whitespace characters, \w = one
# word character; "^" and "$" pin the pattern to both ends of the string.
print(re.compile(R"^\D\s{2}\w$").match("a  _"))

import re
# One letter a-f in either case, three lowercase letters, then an even digit.
print(re.compile(R"[a-fA-F][a-z]{3}[02468]").findall("bddf42fbas8"))

# "*" allows zero or more lowercase letters between "na" and the closing "e".
print(re.compile(R"na[a-z]*e").findall("my name is Alice,nae,nattore"))

['name', 'nae', 'nattore']

# "+" requires at least one lowercase letter between "na" and the closing "e".
print(re.compile(R"na[a-z]+e").findall("my name is Alice,nae,nattore"))

['name', 'nattore']

# "?" allows at most one lowercase letter between "na" and the closing "e".
print(re.compile(R"na[a-z]?e").findall("my name is Alice,nae,nattore"))

['name', 'nae']

# Accept an ID string of 17 digits + one digit/"x" (18 characters) or of
# 14 digits + one digit/"x" (15 characters).
# Alternatives are tried left to right, so the longer form is listed first:
# with the shorter one first, match() stopped after the first 15 characters of
# an 18-character input. fullmatch additionally rejects trailing characters.
pattern = re.compile(r"(\d{17}[0-9x]|\d{14}[0-9x])")
print(pattern.fullmatch("34262320001218646x"))

# "{4}": "na", then exactly four lowercase letters, then a closing "e".
print(re.compile(R"na[a-z]{4}e").findall("my name is Alice,nae,nattore"))

['nattore']

# "{3,10}": "na", then three to ten lowercase letters, then a closing "e".
print(re.compile(R"na[a-z]{3,10}e").findall("my name is Alice,naicajoe,nattorirce"))

['naicajoe', 'nattorirce']

# "{3,}": "na", then at least three lowercase letters, then a closing "e".
print(re.compile(R"na[a-z]{3,}e").findall("my name is Alice,naicajoe,nattorighjrce"))

['naicajoe', 'nattorighjrce']

# Quantifiers are greedy by default: each match takes as many digits as it can.
# The patterns are raw strings so that "\d" reaches the regex engine as written
# instead of being parsed as an (invalid) string escape.
print(re.findall(r"\d+", "12345678888888abc"))
print(re.findall(r"\d*", "12345678888888abc"))      # "*" also yields empty matches where no digit is found
print(re.findall(r"\d{3,}", "12345678888888abc"))
print(re.findall(r"\d{3,8}", "1234567888888888abc"))  # each match is capped at eight digits

['12345678888888']
['12345678888888', '', '', '', '']
['12345678888888']
['12345678', '88888888']

# A "?" after a quantifier makes it lazy: each match takes as few digits as
# the quantifier allows. Raw strings keep "\d" from being parsed as an
# (invalid) string escape.
print(re.findall(r"\d+?", "12345678888888abc"))      # one digit per match
print(re.findall(r"\d{3,}?", "12345678888888abc"))   # three digits per match

['1', '2', '3', '4', '5', '6', '7', '8', '8', '8', '8', '8', '8', '8']
['123', '456', '788', '888']

^      开始位置
$      结束位置
\b     单词边界
\B     非单词边界

# "^" and "$" pin the pattern to the start and end of the string:
# "95", three digits, then a final "8".
print(re.compile(r"^95\d{3}8$").findall("958348"))

['958348']

# Sample text, assembled from adjacent string literals inside parentheses.
str01 = (
    "Use this toggle to the left to manage how your "
    "browser uses BBC’s performance cookies. If you’re "
    "outside the UK you can also use the toggle to set "
    "your preferences for personalised advertising cookies."
)
# Whole words (a \b word boundary on each side) that begin with a, b or c in
# either case and continue with lowercase letters only.
pattern = re.compile(r"\b[abcABC][a-z]*\b")
print(re.findall(pattern, str01))

['browser', 'cookies', 'can', 'also', 'advertising', 'cookies']

import re
# Find ID strings of 17 digits + one digit/"x" or 14 digits + one digit/"x".
# Fixes relative to the earlier form of this pattern:
#   * a stray "]" after the last character class made the 18-character branch
#     require a literal "]" and therefore never match a real ID;
#   * alternatives are tried left to right, so the longer form now comes first,
#     otherwise an 18-character ID is cut off after 15 characters;
#   * the pattern is a raw string so "\d" is not parsed as a string escape.
pattern = re.compile(r"\d{17}[0-9x]|\d{14}[0-9x]")
print(pattern.findall("34262219971012x"))

['34262219971012x']

# Sample text, assembled from adjacent string literals inside parentheses.
str01 = (
    "Use this toggle to the left to manage how your "
    "browser uses BBC’s performance cookies. If you’re "
    "outside the UK you can also use the toggle to set "
    "your preferences for personalised advertising cookies."
)
# Lowercase words ending in "es", "ing" or "er". Because the suffix sits in a
# capturing group, findall returns only the captured suffix of each match.
pattern = re.compile(r"\b[a-z]*(es|ing|er)\b")
print(re.findall(pattern, str01))

['er', 'es', 'es', 'es', 'ing', 'es']

import re
# \1 and \2 refer back to the first and second captured letters, so the
# pattern matches a five-letter lowercase word that reads the same backwards.
# With two groups in the pattern, findall returns one (group1, group2) tuple
# per match.
print(re.compile(r"\b([a-z])([a-z])[a-z]\2\1\b").findall("fdadd abcba"))

[('a', 'b')]

import re
match_result = re.finditer(r"\b([a-z])([a-z])[a-z]\2\1\b","fdadd abcba")
match_list = []
for i in match_result:

Python正则表达式（上）

Python正则表达式（上）

一、正则表达式介绍

1. 正则表达式的匹配流程：

2. 正则表达式的应用流程

3. 正则表达式的基本语法

二、预定义字符

1. 通配字符

2. 反斜杠

三、字符集

1. 系统正则表达式字符集

2. 用户自定义正则表达式字符集

四、正则表达式中量词

1. 三种量词符号

2. 花括号表示重复次数

3. 贪婪模式和非贪婪模式

五、字符边界

1. 字符串的开始和结束

2. 字符串的边界

六、逻辑判断

七、分组

1. 捕获组与非捕获组