Python爬虫--08 淘宝比价


import json
import re

import requests

def getHTMLText(url):
    """Download *url* and return the response body decoded as UTF-8.

    Args:
        url: Address of the page to fetch.

    Returns:
        The response text. If the request fails (connection problem,
        timeout, or an HTTP error status), ``'Fail'`` is printed and an
        empty string is returned so callers always receive a ``str``.
    """
    try:
        # Without a timeout a stalled connection would block forever.
        r = requests.get(url, timeout=30)
        r.raise_for_status()
        r.encoding = 'utf-8'
        return r.text
    except requests.RequestException:
        # Only network/HTTP failures are handled here; programming errors
        # and KeyboardInterrupt are allowed to propagate.
        print('Fail')
        return ''

def parsePage(html, ilt):
    """Collect ``[title, price]`` pairs found in *html* and append them to *ilt*.

    The page text is scanned for ``"raw_title":"..."`` and
    ``"view_price":"..."`` fields. Matches are paired in order of
    appearance; if one field occurs more often than the other, the surplus
    matches are ignored.

    Args:
        html: Page text to scan. ``None`` or an empty string is ignored.
        ilt: List that receives one ``[title, price]`` entry (both strings)
            per product. It is mutated in place.
    """
    if not html:
        return

    # Capture just the quoted value. The title pattern accepts backslash
    # escapes so that an escaped quote inside a title does not end the match.
    titles = re.findall(r'"raw_title":"((?:[^"\\]|\\.)*)"', html)
    prices = re.findall(r'"view_price":"([\d.]*)"', html)

    for raw_title, price in zip(titles, prices):
        try:
            # Decode escapes as a JSON string literal. This replaces eval(),
            # which would execute arbitrary code taken from the remote page.
            title = json.loads('"' + raw_title + '"')
        except ValueError:
            # Not a valid JSON string body: keep the raw text rather than
            # dropping the product.
            title = raw_title
        ilt.append([title, price])


def printGoodsList(ilt):
    """Print the collected goods as a tab-separated table.

    A header row is printed first, followed by one row per entry of *ilt*
    numbered from 1.

    Args:
        ilt: Sequence of entries whose first element is the product title
            and whose second element is the price.
    """
    row_format = "{:4}\t{:32}\t{:8}"
    header = row_format.format("序号", "商品名称", "价格")
    print(header)
    for index, item in enumerate(ilt, start=1):
        line = row_format.format(index, item[0], item[1])
        print(line)


def main(goods='书包', page=3):
    """Search for *goods*, scrape *page* result pages and print a price table.

    Args:
        goods: Search keyword appended to the search URL's ``q`` parameter.
        page: Number of result pages to request.
    """
    start_url = 'https://s.taobao.com/search?q=' + goods
    # NOTE(review): 44 is presumably the number of results per page, used
    # as the step of the ``s`` offset parameter -- confirm against the site.
    offset_step = 44
    infolist = []
    for i in range(page):
        url = start_url + '&s=' + str(offset_step * i)
        try:
            html = getHTMLText(url)
            parsePage(html, infolist)
        except Exception:
            # Best effort: a page that fails is skipped. ``Exception`` rather
            # than a bare ``except`` so Ctrl-C still stops the crawl.
            continue

    printGoodsList(infolist)

# Run the crawl only when this file is executed as a script, so that
# importing it does not trigger network requests.
if __name__ == '__main__':
    main()

发布了108 篇原创文章 · 获赞 7 · 访问量 5188

猜你喜欢

转载自blog.csdn.net/qq_25672165/article/details/104906721