jd 京东店铺链接获取

def page():
    """Click a pagination link in the goods list and pause for one second.

    Parses the current ``browser.page_source``, counts every ``<a>`` inside
    the first ``<div class="jPage">`` and clicks the anchor at that (1-based)
    position under ``//*[@id="J_GoodsList"]/div``. The XPath that is about to
    be clicked is printed first.

    NOTE(review): the last anchor of the pager is presumably the "next page"
    link -- confirm against the live page markup.

    Raises:
        IndexError: if the page contains no ``div.jPage`` element.
    """
    soup = bs(browser.page_source, 'lxml')
    pager = soup.find_all('div', class_='jPage')[0]
    anchor_count = len(pager.find_all('a'))

    xpath = '//*[@id="J_GoodsList"]/div/a[{0}]'.format(anchor_count)
    print(xpath)

    # The find_element_by_* helpers were removed in Selenium 4.3. The generic
    # find_element(by, value) form is available in both Selenium 3 and 4
    # ('xpath' is the value of By.XPATH).
    # Assumes `browser` is a Selenium WebDriver -- it is defined elsewhere.
    browser.find_element('xpath', xpath).click()
    time.sleep(1)
    

def li():
    """Record the links of the list items on the current page into ``shu``.

    Parses ``browser.page_source``, finds every ``<li>`` whose class is
    ``'jSubObject gl-item'``, takes the ``href`` of its first ``<a>`` and
    prefixes it with ``'https:'``. URLs not yet in the module-level list
    ``shu`` are appended and printed together with the running total; URLs
    already present only produce a notice.

    Items without an ``<a>`` or without a non-empty ``href`` are skipped
    instead of raising.

    NOTE(review): the ``'https:'`` prefix assumes the hrefs are
    protocol-relative (``//host/path``) -- confirm against the page markup.
    """
    soup = bs(browser.page_source, 'lxml')

    for item in soup.find_all('li', class_='jSubObject gl-item'):
        anchor = item.a
        href = anchor.get('href') if anchor is not None else None
        if not href:
            # Nothing to record for this item.
            continue

        url = 'https:' + href

        if url in shu:
            print('已经有了')
        else:
            shu.append(url)
            print(url)
            print(len(shu))
            print('\n')


def mall(s):
    """Run ``s`` rounds of scraping the current page and then paginating.

    Each round calls ``li()`` to record the links on the current page,
    calls ``page()`` to click the pagination link, and then sleeps for
    three seconds. ``page()`` is also called after the final round.

    Args:
        s: Number of rounds to run.
    """
    for _ in range(s):
        # li() returns nothing; it records its results in the module-level
        # list `shu`.
        li()
        page()
        time.sleep(3)
        

# Module-level accumulator: li() appends each newly seen URL here and also
# checks membership against it to skip duplicates.
shu = []

猜你喜欢

转载自blog.csdn.net/AnYeZhiYin/article/details/105706688
今日推荐