# 正则表达式01-简单使用规则

import re

# Single-character matching rules.
# re.match() only matches at the start of the text and returns None when the
# pattern does not match, so every example checks the result before calling
# .group(); a failed match prints None instead of raising AttributeError.
# Patterns containing backslashes are raw strings so that sequences such as
# \d reach the regex engine without invalid-escape warnings.

# 1. Match a literal string.
text = "hello"
ret = re.match('he', text)
print(ret.group() if ret else None)

# 2. Dot: matches any single character except a newline (without re.DOTALL),
#    so "\n" does not match here.
text = "\n"
ret = re.match(r'.', text)
print(ret.group() if ret else None)

# 3. \d: matches any digit (0-9).
text = "1"
ret = re.match(r'\d', text)
print(ret.group() if ret else None)

# 4. \D: matches any non-digit character.
text = "a"
ret = re.match(r'\D', text)
print(ret.group() if ret else None)

# 5. \s: matches a whitespace character (\n, \t, \r, space).
text = "\r"
ret = re.match(r'\s', text)
print(ret.group() if ret else None)

# 6. \w: matches a-z, A-Z, digits and underscore; "+" is none of these,
#    so this example does not match.
text = "+"
ret = re.match(r'\w', text)
print(ret.group() if ret else None)

# 7. \W: the opposite of \w; "a" is a word character, so no match.
text = "a"
ret = re.match(r'\W', text)
print(ret.group() if ret else None)

# 8. [] character class: any character listed inside the brackets matches.
#    Here: one or more digits or hyphens.
text = "0731-88888888asfa"
ret = re.match(r'[\d\-]+', text)
print(ret.group() if ret else None)

# 8.1. Bracket form in place of \d (ASCII digits).
text = "898234"
ret = re.match(r'[0-9]', text)
print(ret.group() if ret else None)

# 8.2. Bracket form in place of \D; "1" is a digit, so no match.
text = "1"
ret = re.match(r'[^0-9]', text)
print(ret.group() if ret else None)

# 8.3. Bracket form in place of \w.
text = "_"
ret = re.match(r'[a-zA-Z0-9_]', text)
print(ret.group() if ret else None)

# 8.4. Bracket form in place of \W; "0" is a word character, so no match.
text = "0"
ret = re.match(r'[^a-zA-Z0-9_]', text)
print(ret.group() if ret else None)


############ 匹配多个字符 ############
# 9. *:可以匹配0或者任意多个字符
text = "abcd"
ret = re.match('\s*',text)
print(ret.group())

# 10. +:匹配1个或者多个字符
text = "+abcd"
ret = re.match('\w+',text)#用*匹配不会报错
print(ret.group())

# 11. ?:匹配一个或者0个(要么没有,要么就只有一个)
text = "abcd"
ret = re.match('\w?',text)
print(ret.group())

# 12. {m}:匹配m个字符。
text = "abcd"
ret = re.match('\w{2}',text)
print(ret.group())

# 13. {m,n}:匹配m-n个字符
text = "abcdab"
ret = re.match('\w{1,5}',text)
print(ret.group())

############ Small case studies ############
# re.match() returns None when the pattern does not match, so each example
# checks the result before calling .group(); an invalid input prints None
# instead of raising AttributeError. Patterns are raw strings so the regex
# escapes are passed through unchanged.
# NOTE: re.match() only anchors at the start of the text; these patterns do
# not reject trailing characters after a valid prefix.

# 14. Validate a mobile phone number: "1", then one of 3/4/5/7/8, then nine
#     digits. The sample's second digit is 2, so it does not match.
text = "12578900980"
ret = re.match(r'1[34578]\d{9}', text)
print(ret.group() if ret else None)

# 15. Validate an e-mail address. The sample has no "." after the domain
#     name, so it does not match.
text = "hynever12_@163com"
ret = re.match(r'\w+@[a-z0-9]+\.[a-z]+', text)
print(ret.group() if ret else None)

# 16. Validate a URL: a scheme followed by "://" and non-whitespace characters.
text = "https://baike.baidu.com/item/Python/407313?fr=aladdin"
ret = re.match(r'(http|https|ftp)://[^\s]+', text)
print(ret.group() if ret else None)

# 17. Validate an ID card number: 17 digits followed by a digit, "x" or "X".
#     The sample ends with "a", so it does not match.
text = "31131118908123230a"
ret = re.match(r'\d{17}[\dxX]', text)
print(ret.group() if ret else None)

# Anchors, alternation and greedy vs. non-greedy matching.
# re.match()/re.search() return None when nothing matches, so each example
# checks the result before calling .group(); a failed match prints None
# instead of raising AttributeError. Patterns are raw strings so the regex
# escapes are passed through unchanged.

# 18. ^ (caret): anchors the pattern at the start of the text.
text = "hello"
ret = re.search(r'^h', text)
print(ret.group() if ret else None)

# 19. $: anchors the pattern at the end of the text.
#     The dot is escaped so that only a literal "." is accepted.
text = "xxx@163.com"
ret = re.match(r'\w+@163\.com$', text)
print(ret.group() if ret else None)

# 20. |: matches any one of several strings or expressions.
text = "https"
ret = re.match(r'(ftp|http|https)$', text)
print(ret.group() if ret else None)

# 21. Greedy vs. non-greedy mode: a trailing ? makes a quantifier match as
#     few characters as possible.
text = "0123456"
ret = re.match(r'\d+?', text)
print(ret.group() if ret else None)

text = "<h1>标题</h1>"
ret = re.match(r'<.+?>', text)
print(ret.group() if ret else None)

# 22. Match numbers between 0 and 100.
# Allowed: 1, 2, 3, 10, 100, 99
# Three cases: one digit (e.g. 1), two digits (e.g. 99), and 100
# Not allowed: 09, 101
# NOTE: as written the pattern requires a leading 1-9, so a bare "0" is not
# accepted; "01" below does not match.
text = "01"
ret = re.match(r'[1-9]\d?$|100$', text)
print(ret.group() if ret else None)

  

# posted @ 2020-03-13 11:31  胡辣汤王子  阅读(291)  评论(0)  编辑  收藏  举报