1. 使用正则完成下列内容的匹配
- 匹配陕西省区号 029-12345
- 匹配邮政编码 745100
- 匹配邮箱 lijian@xianoupeng.com
- 匹配身份证号 62282519960504337X
# Exercise 1: validate four sample strings with regular expressions.
#
# Each pattern is compiled once as a raw string and applied with
# ``fullmatch`` so the WHOLE input has to conform; a prefix or suffix that
# merely looks right is rejected.
import re

# Sample inputs, one per pattern below.
str1 = "029-12345"
str2 = "745100"
str3 = "lijian@xianoupeng.com"
str4 = "62282519960504337X"

# Area code: the literal prefix "029-" followed by at least one ASCII digit.
AREA_CODE_PATTERN = re.compile(r"029-[0-9]+")

# Postal code: exactly six ASCII digits.
POSTAL_CODE_PATTERN = re.compile(r"[0-9]{6}")

# Email: non-empty local part, a single "@", a non-empty domain, and a
# ".com" ending. Whitespace and additional "@" characters are rejected.
EMAIL_PATTERN = re.compile(r"[^@\s]+@[^@\s]+\.com")

# ID card number: exactly 18 characters, 17 digits followed by a digit or
# x/X. Inside a character class "|" is a literal, so it must not be listed.
ID_CARD_PATTERN = re.compile(r"[0-9]{17}[0-9xX]")

# Each call prints the match object, or None when the sample is invalid.
print(AREA_CODE_PATTERN.fullmatch(str1))
print(POSTAL_CODE_PATTERN.fullmatch(str2))
print(EMAIL_PATTERN.fullmatch(str3))
print(ID_CARD_PATTERN.fullmatch(str4))

# 2. Crawl the school's official website, collect the paths of all images,
#    and store those paths in a local file; implement it with a decorator.
# Exercise 2: fetch a web page, pull out the path of every image on it and
# append those paths to a local text file by means of a decorator.
import functools
import re

# Browser-like User-Agent sent with the request.
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/116.0.0.0 Safari/537.36 Edg/116.0.1938.62'}

# Captures the value of the ``src`` attribute of an <img> tag. The attribute
# may appear anywhere inside the tag and use single or double quotes;
# requiring whitespace before "src" keeps attributes such as "data-src" out.
IMG_SRC_PATTERN = re.compile(
    r'<img\b[^>]*?\ssrc\s*=\s*["\']([^"\']+)["\']',
    re.IGNORECASE,
)


def save(fn):
    """Decorator that appends every item returned by *fn* to a local file.

    The wrapped function must return an iterable of strings. Each item is
    written on its own line to ``picture_url.txt`` (opened in append mode,
    UTF-8). The wrapped function's result is passed back to the caller
    unchanged.
    """
    @functools.wraps(fn)
    def wrapper(*args, **kwargs):
        # Call first so nothing is created on disk when fn raises.
        result = fn(*args, **kwargs)
        with open("picture_url.txt", "a+", encoding="utf-8") as f:
            # One entry per line; without the separator the paths run together.
            f.writelines(f"{item}\n" for item in result)
        return result
    return wrapper


def extract_image_paths(html):
    """Return the ``src`` value of every <img> tag in *html*, in page order."""
    return IMG_SRC_PATTERN.findall(html)


@save
def get_picture(url):
    """Download *url* and return the list of image paths found in the page.

    Because of the ``save`` decorator the paths are also appended to
    ``picture_url.txt``.
    """
    # Imported here so the parsing and saving helpers stay importable on
    # machines where the third-party ``requests`` package is not installed.
    import requests

    # NOTE(review): verify=False turns off TLS certificate verification. It
    # is kept from the original, presumably to work around the site's
    # certificate; confirm whether it is still needed and drop it if not.
    # The timeout keeps an unresponsive server from blocking forever.
    res = requests.get(url, headers=headers, verify=False, timeout=10)
    return extract_image_paths(res.text)


if __name__ == '__main__':
    url = "https://www.mdit.edu.cn/"
    picture = get_picture(url)

# 3. Small exercise
屏幕录制 2026-02-07 160245