商品SKU

会有一股神秘感。 提交于 2020-03-24 11:01:30
import requests
import re
import pandas as pd
import pymysql

# Let libraries that expect the MySQLdb module use PyMySQL instead.
pymysql.install_as_MySQLdb()
from sqlalchemy import create_engine
import time
import logging

# HTTP headers sent with every item-page request. The cookie is a captured
# browser session; it is assembled from adjacent string literals (one cookie
# pair per line) so that the final value is a single line with no embedded
# newline.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.131 Safari/537.36",
    'cookie': (
        'cna=YmdIFYYEcVMCATy+6cYV7pO7; '
        't=adaf0c3bf86835603c597adfc1b0b875; '
        'hng=CN%7Czh-CN%7CCNY%7C156; '
        'thw=cn; '
        'tg=0; '
        'ali_ab=60.190.233.198.1556248533986.3; '
        'UM_distinctid=16a873f95f6326-0ab1211d27a5ca-f353163-1fa400-16a873f95f7987; '
        'mt=ci=33_1&np=; '
        '_tb_token_=NdGOJfjtYxmUxF6eBNYE; '
        'cookie2=1129bac788da762f2fc3dc2c31b61a38; '
        'v=0; '
        '_m_h5_tk=d3bac98f67e17d0491be6ac24fe972dd_1557735439567; '
        '_m_h5_tk_enc=d3390800dc68df57fc1b75bbb70cc8a5; '
        'unb=363984921; '
        'sg=312; '
        '_l_g_=Ug%3D%3D; '
        'skt=e40a50c529c9ca8e; '
        'cookie1=ACPl%2Ff%2BzGp66ZdFRG9knxI5XoCVXhR9WG1xO%2FUG4dwc%3D; '
        'csg=31b7be14; '
        'uc3=vt3=F8dBy3qIhOt5DMx3%2Bxo%3D&id2=UNaE8tOwscZl&nk2=szPwK%2FJkWAu%2FhoZP1cgV&lg2=UtASsssmOIJ0bQ%3D%3D; '
        'existShop=MTU1NzcyNTc0MQ%3D%3D; '
        'tracknick=%5Cu8C22%5Cu4F5C%5Cu5A01707924553; '
        'lgc=%5Cu8C22%5Cu4F5C%5Cu5A01707924553; '
        '_cc_=W5iHLLyFfA%3D%3D; '
        'dnk=%5Cu8C22%5Cu4F5C%5Cu5A01707924553; '
        '_nk_=%5Cu8C22%5Cu4F5C%5Cu5A01707924553; '
        'cookie17=UNaE8tOwscZl; '
        'uc1=cookie16=VT5L2FSpNgq6fDudInPRgavC%2BQ%3D%3D&cookie21=UIHiLt3xTIkz&cookie15=U%2BGCWk%2F75gdr5Q%3D%3D&existShop=false&pas=0&cookie14=UoTZ48JVyDnTlA%3D%3D&tag=8&lng=zh_CN; '
        'enc=4sdKSidVGl7W9qpdANZb5oGoKUO%2F1hBeMD%2F5tLQjGIhgPZ2J22LhXD%2FydDw7UFOd%2F%2FJ6YLTNDwpwUQY2wNZeHg%3D%3D; '
        'x=479184430%26e%3D1%26p%3D*%26s%3D0%26c%3D0%26f%3D0%26g%3D0%26t%3D0%26__ll%3D-1%26_ato%3D0; '
        'swfstore=299154; '
        'pnm_cku822=098%23E1hvnQvUvbpvUpCkvvvvvjiPRLSwAjlbn2SW1j3mPmPhtjiRRLM96jE8n2dO0jtPR8wCvvBvpvpZRphvChCvvvvPvpvhMMGvvvhCvvXvppvvvvvEvpCWBVTuv8RAnhhAcUmxdBQaUmx%2Fgj7xhpydfvc6lCAXal%2B0747BhC3qVmHoDOmOVzIUExjxALwp8BpDN%2BBljdUf8B6s%2BXZz%2BsBwN6fW0byCvm3vpvvvvvCvphCvh8pvvhR8phvwv9vvBj1vpCQmvvChxhCvjvUvvhBZkphvCyEmmvofVuyCvv3vpvoill%2FQg9%3D%3D; '
        'x5sec=7b2273686f7073797374656d3b32223a223233626530613037323138396631373133663036326535623934333633386633434f434c354f5946454a6a477a7669427770436278414561437a4d324d7a6b344e446b794d54737a227d; '
        'whl=-1%260%260%261557726692034; '
        'l=bBMrGiYVvCcIjkC2BOCwZQKXGi_OxIRAguSJGNzMi_5Ie1L_jw_Old9Lfep6Vj5R_VYB4UaStkw9-etkO; '
        'isg=BKWlldC2FX0WonE5blob6kQStGFz8kl4KxbRgqeKM1zrvsUwbzZBRQVWSGJtvnEs'
    ),
}

# Disabled alternative that read the item IDs from a database table instead
# of the Excel workbook (kept from the original script):
# conn1 = create_engine('mysql+mysqldb://xiaozhu:xiaozhu13579@47.110.87.60/douyin?charset=utf8mb4')
# sql ='SELECT ID from 淘宝id'

# Parameterized statement: the driver escapes the values, so quotes inside a
# scraped title or SKU can no longer break (or inject into) the SQL.
_SKU_UPSERT_SQL = "replace into 淘宝sku(SKU,title,id) values (%s,%s,%s)"


def _extract_sku(page_text):
    """Return the SKU text found in an item page, or None if none is found.

    Two page layouts are tried in order:

    1. A ``propertyMemoMap: {...}`` fragment. Its content is split on commas,
       every second piece is kept, and the third ``:``-separated field of each
       kept piece is concatenated.
    2. The first ``<li title="...">`` element, with its commas removed.

    Raises:
        IndexError: if a kept ``propertyMemoMap`` piece has fewer than three
            ``:``-separated fields.
    """
    memo_matches = re.findall(r'propertyMemoMap: {(".*?")}', page_text)
    if memo_matches:
        pieces = memo_matches[0].split(",")[::2]
        return "".join(piece.split(":")[2] for piece in pieces)

    li_matches = re.findall(r' <li title="(.*?)</li>', page_text)
    if li_matches:
        return "".join(li_matches[0].split(","))

    return None


def _save_sku(sku, title, item_id):
    """Insert or replace one row in the 淘宝sku table, then close the connection."""
    conn = pymysql.connect(host="*", user="*", passwd="*", db="*")
    try:
        params = (sku, title, item_id)
        print(_SKU_UPSERT_SQL, params)
        with conn.cursor() as cursor:
            cursor.execute(_SKU_UPSERT_SQL, params)
        conn.commit()
    finally:
        # The original opened a new connection per row and never closed it.
        conn.close()


def goo(xh, max_retries=3):
    """Scrape SKU text for each item ID in the Excel workbook and store it.

    Item IDs are read from the ``ID`` column of the workbook. For each ID,
    starting at row ``xh``, the item page is fetched, the SKU text and page
    title are extracted, and the row is written to the ``淘宝sku`` table.
    Pages with no recognisable SKU are reported and skipped.

    Args:
        xh: Row index to start from; lets an interrupted run be resumed.
        max_retries: Maximum attempts per item when the HTTP request or the
            database write fails. After that the item is skipped. Values
            below 1 are treated as 1.

    Returns:
        None.
    """
    item_ids = pd.read_excel(r'C:\Users\mgxx\Desktop\淘宝id.xlsx')['ID']
    attempts_allowed = max(1, max_retries)

    for i in range(xh, len(item_ids)):
        item_id = item_ids.at[i]
        print(str(i) + '-------------------------------------------------------' + str(item_id))
        url = 'https://item.taobao.com/item.htm?id=' + str(item_id)

        # Bounded, iterative retry. The original recursed into goo(i) on any
        # error, which re-read the workbook and never terminated on a
        # persistent failure.
        for attempt in range(1, attempts_allowed + 1):
            try:
                html = requests.get(url, headers=headers, timeout=5)
                titles = re.findall(r'<title>(.*?)</title>', html.text)
                sku = _extract_sku(html.text)
                if sku is None:
                    print('可能是邮费----', titles)
                    break
                # A page without <title> used to raise IndexError here.
                title = titles[0] if titles else ''
                _save_sku(sku, title, str(item_id))
                # Pause between stored items, as the original did.
                time.sleep(2)
                break
            except (requests.RequestException, pymysql.MySQLError) as e:
                # Possibly transient (network / database): retry.
                logging.exception(e)
                print('错了')
                if attempt < attempts_allowed:
                    time.sleep(2)
            except Exception as e:
                # Parsing problems will not fix themselves: skip the item.
                logging.exception(e)
                print('错了')
                break
        else:
            logging.error(
                "giving up on item %s after %d attempts", item_id, attempts_allowed
            )


if __name__ == '__main__':
    goo(0)
标签
易学教程内所有资源均来自网络或用户发布的内容,如有违反法律规定的内容欢迎反馈
该文章没有解决你所遇到的问题?点击提问,说说你的问题,让更多的人一起探讨吧!