import re
# Liberal, case-insensitive URL matcher, compiled once at import time.
# Capture group 1 spans the whole URL; the inner groups only exist so that
# parenthesised segments (up to two levels deep) may appear inside a URL.
_URL_PATTERN = re.compile(
    r"(?i)\b((?:https?://|www\d{0,3}[.]|[a-z0-9.\-]+[.][a-z]{2,4}/)(?:[^\s()<>]+|\(([^\s()<>]+|(\([^\s()<>]+\)))*\))+(?:\(([^\s()<>]+|(\([^\s()<>]+\)))*\)|[^\s`!()\[\]{};:'\".,<>?«»“”‘’]))"
)


def getUrl(string: str) -> list:
    """Return every URL-like substring of *string*, in order of appearance.

    A candidate must start with ``http://`` or ``https://``, with ``www``
    (optionally followed by up to three digits) and a dot, or with a bare
    domain name followed by ``/``.  The match may not end in whitespace,
    brackets, quotes or common sentence punctuation, so a trailing comma or
    period is left out of the result.

    Args:
        string: Text to scan.

    Returns:
        A list of the matched URL strings; empty when nothing matches.
    """
    # NOTE: the pattern nests quantifiers, so very long inputs that almost
    # match may backtrack heavily; be careful with untrusted, unbounded text.
    return [match.group(1) for match in _URL_PATTERN.finditer(string)]
# Demo: run the extractor on a sample sentence and print the resulting list.
string = 'Python Program List: https://www.idoubi.net/blog/cat/python'
extracted = getUrl(string)
print(extracted)
输出:
['https://www.idoubi.net/blog/cat/python']
- 本文固定链接: http://jingyan.idoubi.net/4776.html
- 转载请注明: 搬运工 于 逗分享开发经验 发表