上传文件至 ''
Elevate your style with our [Wholesale Ring Jewelry](https://www.kirinjewelrywholesale.com/collections/925-sterling-silver-ring) collection. Crafted with precision and elegance, our sterling silver rings are timeless expressions of sophistication, meticulously polished for enduring beauty.
Signed-off-by: kirinjewelry <kr13702570566@gmail.com>
main
parent
874286fbea
commit
2500e17e40
@ -0,0 +1,48 @@
|
|||||||
|
import requests
|
||||||
|
import parsel
|
||||||
|
from tqdm import tqdm
|
||||||
|
import csv
|
||||||
|
import time
|
||||||
|
|
||||||
|
# Request headers shared by every HTTP call in this script: a desktop Chrome
# user-agent string is sent instead of the default one from `requests`.
header = {
    "user-agent": (
        "Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
        "AppleWebKit/537.36 (KHTML, like Gecko) "
        "Chrome/109.0.0.0 Safari/537.36"
    ),
}
|
||||||
|
|
||||||
|
|
||||||
|
def get_vidio(pageurl):
    """Download the video embedded in a product detail page and log its name.

    Fetches ``pageurl``, reads the title from the ``<h1>`` and the video
    address from the ``video-src`` attribute of the ``<img>`` inside the
    ``v620a34694dad7`` container, saves the video as ``vidio/<name>.mp4``
    (``<name>`` is the part of the title after its last ``-``) and appends
    the name to ``vidio.csv``. Sleeps 5 seconds after a successful download.

    Prints a failure message and returns without writing anything when the
    page or the video cannot be fetched, or when the page does not contain
    the expected title / video address.

    Args:
        pageurl: Absolute URL of the product detail page.

    Raises:
        requests.RequestException: On connection errors, timeouts or an
            unusable video URL.
        OSError: If the video or the CSV file cannot be written.
    """
    # Local import: the script's import block does not bring `os` into scope.
    import os

    response = requests.get(url=pageurl, headers=header, timeout=30)
    if response.status_code != 200:
        print("无法获取视频")
        return

    select = parsel.Selector(response.text)
    title = select.xpath('//*[@id="v620a34694dad7"]//h1/text()').get()
    vidio_url = select.xpath('//*[@id="v620a34694dad7"]//img/@video-src').get()
    # `.get()` yields None when the node is absent; bail out instead of
    # failing later with AttributeError / an invalid-URL error.
    if not title or not vidio_url:
        print("无法获取视频")
        return
    vidio_name = title.split("-")[-1]

    vidio_res = requests.get(url=vidio_url, headers=header, timeout=30)
    # Do not store an error page under an .mp4 name.
    if vidio_res.status_code != 200:
        print("无法获取视频")
        return

    # Build the path portably and make sure the target directory exists.
    os.makedirs("vidio", exist_ok=True)
    with open(os.path.join("vidio", "{}.mp4".format(vidio_name)), "wb") as file:
        file.write(vidio_res.content)
    print("{}视频已保存".format(vidio_name))

    with open("vidio.csv", encoding="utf-8", mode="a", newline="") as f:
        csv.writer(f).writerow([vidio_name])

    # Pause between downloads to throttle the request rate.
    time.sleep(5)
|
||||||
|
|
||||||
|
# Walk listing pages 2..86 and download the video of every product that each
# listing links to. Failures are reported and skipped so one bad page or
# product does not stop the crawl.
for page in tqdm(range(2, 87)):
    print("正在爬取第{}页".format(page))
    url = "https://www.kirinjewelry2006.com/products-list-{}".format(page)
    try:
        response = requests.get(url=url, headers=header, timeout=30).text
    except requests.RequestException as exc:
        print("第{}页获取失败: {}".format(page, exc))
        continue
    select = parsel.Selector(response)

    lis = select.xpath('//*[@id="v6204665765bf2"]/div/div[2]/div[2]//div[1]/ul/li')
    for li in lis:
        href = li.xpath('div/a/@href').get()
        # Items without a link would otherwise raise TypeError on the
        # string concatenation below.
        if not href:
            continue
        pageurl = "https://www.kirinjewelry2006.com" + href
        try:
            get_vidio(pageurl)
        except Exception as exc:
            # Best effort per product, but keep Ctrl-C working (no bare
            # `except`) and make the failure visible.
            print("{} 下载失败: {}".format(pageurl, exc))
            continue
|
||||||
@ -0,0 +1,15 @@
|
|||||||
|
import os
|
||||||
|
import csv
|
||||||
|
|
||||||
|
|
||||||
|
# Read product_SKU.csv line by line and keep, for each line, the last
# space-separated field with surrounding whitespace and double quotes removed.
sku_list = []
with open("product_SKU.csv", "r", encoding="utf-8") as file:
    for line in file:
        sku_strlist = line.split(" ")
        skustr = sku_strlist[-1].strip().replace("\"", "")
        sku_list.append(skustr)

# Append one single-column row per SKU. The output file is opened once for
# the whole batch instead of once per row; it is left untouched when there is
# nothing to write.
if sku_list:
    with open("sku_product.csv", mode="a", encoding="utf-8", newline="") as f:
        csv_writer = csv.writer(f)
        csv_writer.writerows([sku] for sku in sku_list)
|
||||||
@ -0,0 +1,23 @@
|
|||||||
|
import requests
|
||||||
|
import parsel
|
||||||
|
from tqdm import tqdm
|
||||||
|
import time
|
||||||
|
import csv
|
||||||
|
|
||||||
|
# Request headers for the forum crawl.
# NOTE: never commit a session cookie here; if authenticated access is
# needed, load the cookie from the environment or a local, untracked file.
header = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/109.0.0.0 Safari/537.36",
}

# Page through the topic 50 posts at a time (st = 0, 50, ..., 5650) and append
# every outbound link found inside <noindex> elements to the CSV file.
for page in tqdm(range(0, 5652, 50)):
    # Throttle: wait 5 seconds before each request.
    time.sleep(5)
    url = "http://molbiol.ru/forums/index.php?showtopic=358346&st={}".format(page)
    try:
        response = requests.get(url=url, headers=header, timeout=30)
    except requests.RequestException as exc:
        # Skip this offset instead of aborting the whole run.
        print("request failed for st={}: {}".format(page, exc))
        continue
    if response.status_code != 200:
        print("unexpected status {} for st={}".format(response.status_code, page))
        continue

    select = parsel.Selector(response.text)
    links = select.xpath('//*[@id="ipbwrapper"]/div[2]//noindex/a/@href').getall()
    if not links:
        continue

    # One open per page rather than per link; the file is still flushed and
    # closed after every page, so an interrupted run keeps what it collected.
    with open("molbiol-ru潜在注册链接.csv", mode="a", encoding="utf-8", newline="") as f:
        csv_writer = csv.writer(f)
        csv_writer.writerows([link] for link in links)
|
||||||
|
|
||||||
|
|
||||||
Loading…
Reference in New Issue