dead-cells-wiki/data/patch/31-2/outfits.py

35 lines
1,010 B
Python
Raw Normal View History

2022-10-07 11:37:25 +08:00
import scrapy
import sys
import requests
import io
sys.path.append("../../convert/31-2")
from db import *
db.bind(provider="sqlite", filename="../../clean/31-2/data.sqlite3")
db.generate_mapping()
class OutfitSpider(scrapy.Spider):
name = "outfits"
start_urls = [
"https://deadcells.fandom.com/wiki/Outfits",
]
def parse(self, response):
for quote in response.css(".wikitable tbody tr"):
name_en = quote.css("td:nth-child(2) > span:last-child::text").get()
if not name_en:
2022-10-13 17:35:47 +08:00
print(name_en)
2022-10-07 11:37:25 +08:00
continue
2022-10-13 17:35:47 +08:00
preview = quote.css(
"td:nth-child(6) > span:last-child a::attr('href')"
).get()
try:
r = requests.get(preview)
with db_session:
w = Outfit.select(name_en=name_en).first()
w.preview = io.BytesIO(r.content).getbuffer().tobytes()
except:
print("Preview not available.")