# coding:utf-8
"""Print the hyperlink targets found in a web page.

Run as a script: it prompts for a URL, downloads that page and prints the
value of every quoted ``href`` attribute, one per line.
"""
import re

# Matches the text between the quotes of an href attribute; the first
# alternative handles double-quoted values, the second single-quoted ones.
HREF_PATTERN = re.compile(r"(?<=href=\").+?(?=\")|(?<=href=\').+?(?=\')")


def extract_links(html):
    """Return the href attribute values found in *html*.

    Args:
        html: Page markup as a text string.

    Returns:
        A list of the matched href values in the order they occur in
        *html*; an empty list when nothing matches.
    """
    return HREF_PATTERN.findall(html)


def main():
    """Prompt for a URL, fetch the page and print each link it contains."""
    # Third-party dependency; imported here so the module (and
    # extract_links) can still be imported where requests is not installed.
    import requests

    # raw_input only exists on Python 2; fall back to input on Python 3.
    try:
        read_line = raw_input
    except NameError:
        read_line = input

    # Fetch the page content.
    page_url = read_line('Input Link:')
    response = requests.get(page_url)

    # Find all links with the regular expression and print each one once.
    # (Re-running the search for every link found would only repeat the
    # same list over and over.)
    for link in extract_links(response.text):
        print(link)


if __name__ == '__main__':
    main()