10.正则表达式

Posted 邹柯

tags:

篇首语:本文由小常识网(cha138.com)小编为大家整理,主要介绍了10.正则表达式相关的知识,希望对你有一定的参考价值。

# 1.检查一串数字是否是电话号码
# 2.检查一个字符串是否符合email
# 3.把一个文本里指定的单词替换为另一个单词
import re
# a = C|C++|Java|C#|Python|javascript
# print(a.index(Python) > -1)  # True
# print(Python in a)           # True

# r=re.findall(Python,a)
# print(r)      # [Python]
# if len(r) > 0:
#     print(字符串中包含Python)
# else:
#     print(No)


# b = C0C++7Java8C#9Python6Javascript
# 查找所有的数字
# r=re.findall(\d,b)
# print(r)      # [0, 7, 8, 9, 6]
# 查找所有的非数字
# r=re.findall(\D,b)
# print(r)      # [C, C, +, +, J, a, v, a, C, #, P, y, t, h, o, n, J, a, v, a, s, c, r, i, p, t]


c = abc, acc, adc, aec, afc, ahc
# 查找中间一个字母是c或f的单词
# r=re.findall(a[cf]c,c)
# print(r)      # [acc, afc]
# 查找中间一个字母不是c并且也不是f的单词
# r=re.findall(a[^cf]c,c)
# print(r)      # [abc, adc, aec, ahc]
# 查找中间一个字母在c-f的单词
# r=re.findall(a[c-f]c,c)
# print(r)      # [acc, adc, aec, afc]


# 概括字符集
# \d \D
# \w 单词字符 \W
# \s 空白字符 \S
# .  匹配除换行符\n之外的所有字符
# e = python1111 java&6\t7\r8\n__php
# r=re.findall([0-9],e) 
# print(r)  # [1, 1, 1, 1, 6, 7, 8]
# r=re.findall([^0-9],e)
# print(r)  # [p, y, t, h, o, n,  , j, a, v, a, &, \t, \r, \n, _, _, p, h, p]
# r=re.findall(\w,e)  # \w等价于[A-Za-z0-9_]
# print(r)  # [p, y, t, h, o, n, 1, 1, 1, 1, j, a, v, a, 6, 7, 8, _, _, p, h, p]
# r=re.findall(\W,e)
# print(r)  # [ , &, \t, \r, \n]
# r=re.findall(\s,e)
# print(r)  # [ , \t, \r, \n]

# 数量词 
# * 匹配0次或无限多次
# + 匹配1次或无限多次
# ? 匹配0次或1次
# 贪婪匹配
# r=re.findall([a-z]{3,6},e)
# print(r)  # [python, java, php]
# 非贪婪匹配
# r=re.findall([a-z]{3,6}?,e)
# print(r)  # [pyt, hon, jav, php]

# f = pytho0python1pythonn2
# r=re.findall(python*,f)
# print(r)  # [pytho, python, pythonn]
# r=re.findall(python+,f)
# print(r)  # [python, pythonn]
# r=re.findall(python?,f)
# print(r)  # [pytho, python, python]

# 贪婪模式
# r=re.findall(python{1,2},f)
# print(r)  # [python, pythonn]
# 非贪婪模式
# r=re.findall(python{1,2}?,f)
# print(r)  # [python, python]


# 边界匹配
# qq = 100001
# 4~8位
# r=re.findall(\d{4,8},qq)
# print(r)  # [100001]
# qq2 = 100000001
# r=re.findall(^\d{4,8}$,qq2)
# print(r)  # []
# r=re.findall(000,qq2)
# print(r)  # [000, 000]
# r=re.findall(^000,qq2)
# print(r)  # []
# r=re.findall(000$,qq2)
# print(r)  # []

# 组 ()
# g = pythonpythonpythonpythonpythonJS
# r=re.findall((python){3}(JS),g)
# print(r)  # [python]

# lanage = PythonC#\nJavaPHP
# 忽略字母大小写匹配
# r=re.findall(c#,lanage,re.I)
# print(r)  # [C#]
# r=re.findall(c#.{1},lanage,re.I | re.S)
# print(r)  # [C#\n]

# 字符串替换
# lanage2 = PythonC#JavaC#PHPC#
# r = re.sub(C#,Go,lanage2,1)
# print(r)  # PythonGoJavaC#PHPC#
# r = re.sub(C#,Go,lanage2,0)
# print(r)  # PythonGoJavaGoPHPGo

# lanage = lanage2.replace(C#,Go)
# print(lanage)  # PythonGoJavaGoPHPGo


# def convert(value):
#     # print(value)  # <_sre.SRE_Match object; span=(6, 8), match=C#>
#                     # <_sre.SRE_Match object; span=(12, 14), match=C#>
#                     # <_sre.SRE_Match object; span=(17, 19), match=C#>
#     matched = value.group()
#     return !! + matched + !!

# r = re.sub(C#,convert,lanage2)
# print(r)  # Python!!C#!!Java!!C#!!PHP!!C#!!


s = A8C3721D86
# def convert(value):
#     matched = value.group()
#     if int(matched) >= 6:
#         return 9
#     else:
#         return 0

# r = re.sub(\d,convert,s)
# print(r)  # A9C0900D99

# 从字符串首字母开始匹配
# r = re.match(\d,s)
# print(r)  # None

# 搜索整个字符串直,返回第一次找到的字符串
# r = re.search(\d,s)
# print(r)   # <_sre.SRE_Match object; span=(1, 2), match=8>
# print(r.group())  # 8

# # 返回第一次查找到字符串的位置
# print(r.span())   # (1, 2)


# j = life is short,i use python
# r = re.search(life(.*)python,j)
# print(r.group(0))   # life is short,i use python
# print(r.group(1))   #  is short,i use 

# r = re.findall(life(.*)python,j)
# print(r)   # [ is short,i use ]

h = life is short,i use python,i love python
r = re.search(life(.*)python(.*)python,h)
# print(r.group(0))     # life is short,i use python,i love python
# print(r.group(1))     #  is short,i use
# print(r.group(2))     # ,i love
# print(r.group(0,1,2)) # (life is short,i use python,i love python,  is short,i use , ,i love )
# print(r.groups())     # ( is short,i use , ,i love )

 

以上是关于10.正则表达式的主要内容,如果未能解决你的问题,请参考以下文章

通过 Java 正则表达式提取 semver 版本字符串的片段

text 正则表达式片段

markdown 正则表达式模式片段

正则表达式匹配特定的 URL 片段而不是所有其他 URL 可能性

攻破难啃的骨头-正则表达式(转)

正则表达式的贪婪和非贪婪模式