ComicScrapy/Comics/spiders/rm_comic.yml
2024-02-20 21:08:13 +08:00

41 lines
1.1 KiB
YAML

# Field extraction rules keyed by output field name.
# A field is written in one of three forms:
#   - a bare XPath string,
#   - a mapping with `xpath` plus `index`,
#   - a mapping with a fixed literal `value`.
# NOTE(review): the nesting below was reconstructed; with every key at the
# same level the repeated `xpath`/`index`/`value` keys collide (duplicate
# keys). Confirm the layout against the spider that loads this file, in
# particular that `chapter_href` and `chapters` belong under `data`.
data:
  name: '//div[@class="col"]/h5/text()'
  icon: '//img[@class="img-thumbnail"]/@src'
  author:
    xpath: '//div[contains(@class,"bookid_bookInfo")]/p[1]/text()'
    # presumably selects one item from the XPath matches — TODO confirm
    # whether the loader treats this as 0- or 1-based
    index: 1
  tags: '//div[contains(@class,"bookid_bookInfo")]/p[3]/b/text()'
  dep:
    xpath: '//div[contains(@class,"bookid_bookInfo")]/p[4]/text()'
    index: 1
  date:
    xpath: '//div[contains(@class,"bookid_bookInfo")]/p[5]/small/text()'
    index: 1
  # Constant fields: no XPath, just a literal value.
  genre:
    value: "韩漫"
  age_rating:
    value: "R18+"
  # Both chapter rules target the same <a> elements: one reads the link
  # target, the other the link text.
  chapter_href: '//div[contains(@class,"bookid_chapterBox")]//div[contains(@class,"bookid_chapter")]/a/@href'
  chapters: '//div[contains(@class,"bookid_chapterBox")]//div[contains(@class,"bookid_chapter")]/a/text()'
# Field rules for the `parse_chapter` step. Every field is a mapping with a
# single `sexec` entry holding a dotted path rooted at `props.pageProps`.
# NOTE(review): presumably `sexec` is a lookup into JSON embedded in the
# page — confirm how the spider evaluates it.
# Each `sexec` is nested under its own field so the keys no longer collide
# at a single level (duplicate keys are invalid YAML).
parse_chapter:
  name:
    sexec: props.pageProps.bookName
  dep:
    sexec: props.pageProps.description
  chapter:
    sexec: props.pageProps.chapterName
  # `image_urls` and `images` intentionally read the same path.
  image_urls:
    sexec: props.pageProps.images
  images:
    sexec: props.pageProps.images
  chapter_api:
    sexec: props.pageProps.chapterAPIPath
# Field rules for the `parse_chapter_api` step. Every field is a mapping with
# a single `sexec` entry holding a dotted path rooted at `chapter`.
# NOTE(review): presumably applied to the response fetched from the
# `chapter_api` path — confirm against the spider.
# Each `sexec` is nested under its own field so the keys no longer collide
# at a single level (duplicate keys are invalid YAML).
parse_chapter_api:
  chapter:
    sexec: chapter.name
  # `image_urls` and `images` intentionally read the same path.
  image_urls:
    sexec: chapter.images
  images:
    sexec: chapter.images