import requests
import re
import time
def analyze(url):
    """Fetch one listing page and append the video links found on it to ``av.txt``.

    The page is requested with a fixed ``User-Agent`` header. When the server
    answers with HTTP 200, every ``<a href="/free-videos/<digits>" class="title"``
    anchor is matched, each numeric id is appended to the site prefix, and the
    resulting URLs are appended to ``av.txt`` one per line. Pages that answer
    with any other status, or that cannot be fetched at all, are skipped.

    Args:
        url: Address of the listing page to download.

    Returns:
        None. The only result is the lines appended to ``av.txt``.
    """
    headers = {
        'User-Agent': 'sadasdasqwweqw',
    }
    try:
        # Without a timeout a single stalled connection blocks the crawl forever.
        response = requests.get(url, headers=headers, timeout=10)
    except requests.RequestException as exc:
        # Skip this page (as non-200 pages are skipped) instead of aborting the run.
        print('request failed for %s: %s' % (url, exc))
        return
    if response.status_code != 200:
        return

    # Only ASCII digits are extracted, so a stray undecodable byte elsewhere in
    # the page should not abort the whole page.
    txt = response.content.decode('utf-8', errors='replace')
    video_ids = re.findall(r'<a href="/free-videos/(\d+)" class="title"', txt)
    if not video_ids:
        # Nothing matched: do not create or touch the output file.
        return

    # Open the output file once per page rather than once per matched id.
    with open('av.txt', 'a', encoding='utf-8') as f:
        f.writelines(
            'http://www.xxxxx.com/xxxxx/' + video_id + '\n'
            for video_id in video_ids
        )
def main():
    """Crawl listing pages 1 through 10, pausing one second after each page."""
    page_template = "http://www.xxxxx.com/xxxxx/?p=%d"
    first_page, last_page = 1, 10
    for page_number in range(first_page, last_page + 1):
        analyze(page_template % page_number)
        # Pause between requests so the pages are not fetched back to back.
        time.sleep(1)
# Start the crawl only when this file is run as a script, not when imported.
if __name__ == '__main__':
    main()
# python(一 爬虫---简单小视频)
# 猜你喜欢
# 转载自 blog.csdn.net/Aidang/article/details/89790758
# 今日推荐
# 周排行