198 lines
8.3 KiB
Python
198 lines
8.3 KiB
Python
import json,os,time,random,shutil
|
||
from utils.HtmlUtils import htmlUtils
|
||
from utils.FileUtils import imageUtils
|
||
from utils.comic.ComicInfo import comicInfo
|
||
from utils.CBZUtils import CBZUtils
|
||
from utils.downloader import download_images
|
||
from utils.downloader import download_comic_icon
|
||
from utils.Ntfy import ntfy
|
||
from utils.CBZUtils import verUtils
|
||
from utils.entity.down.RouMan import comicCommon
|
||
|
||
class baseComic:
|
||
count_chapter = 0
|
||
|
||
@classmethod
|
||
def downladsComcis(cls,book_name,comic_href,updated=None):
|
||
comicInfo.setComicName(book_name)
|
||
if updated != None:
|
||
comicInfo.setUpdateAt(updated)
|
||
random_int = random.randint(5,20)
|
||
comicInfo.setComicName(book_name)
|
||
dir_conf_comic = comicInfo.getDirConfComic()
|
||
if comicInfo.getIsComicNameSkips(book_name):
|
||
print(f"{book_name} 在白名单中,已跳过")
|
||
return None
|
||
if not os.path.exists(dir_conf_comic):
|
||
ntfy.sendMsg(f"{random_int}秒后开始下载 漫画:{book_name}")
|
||
time.sleep(random_int)
|
||
else:
|
||
ntfy.sendMsg(f"已存在 漫画:{book_name}")
|
||
if comicInfo.isUpdateComic():
|
||
return comic_href
|
||
else:
|
||
ntfy.sendMsg(f"{book_name} 已是最新")
|
||
chapters = htmlUtils.xpathData('//div[contains(@class,"bookid_chapterBox")]//div[contains(@class,"bookid_chapter")]/a/text()',url=comic_href,update=False)
|
||
chapter_index = 1
|
||
for chapter in chapters:
|
||
comicInfo.setChapterIndex(chapter_index)
|
||
comicInfo.setChapterName(chapter)
|
||
comicInfo.getNewCBZComicChapter()
|
||
comicInfo.getNewIconComicChapter()
|
||
chapter_index = chapter_index + 1
|
||
return None
|
||
|
||
#print(books)
|
||
#for comicHref in comicsHref:
|
||
# cls.oneComic(comicHref,random.uniform(10,20))
|
||
|
||
@classmethod
|
||
def oneComic(cls,url,title,author,icon,tags,dep,chapters,chapter_href,alias=None,genre="韩漫",lang="zh",sleep=None):
|
||
author = str(author).replace("&",",").replace(" ",",")
|
||
comicInfo.setHomePage(url)
|
||
comicInfo.setComicName(str(title))
|
||
if alias != None:
|
||
comicInfo.setComicNames(title+","+alias)
|
||
comicInfo.setAuthor(author)
|
||
comicInfo.setIcon(icon)
|
||
comicInfo.setTags(tags)
|
||
comicInfo.setDep(dep)
|
||
#comicInfo.setCBS("韩漫")
|
||
comicInfo.setGenre(genre)
|
||
comicInfo.setLang(lang)
|
||
comicInfo.setListChapter(chapters)
|
||
|
||
#comicUtils.setComic(title,alias,icon,author,tags,action,dep,update_date,chapters,chapter_href)
|
||
cls.count_chapter = 0
|
||
for href in chapter_href:
|
||
chapter = chapters[cls.count_chapter]
|
||
comicInfo.setChapterIndex(cls.count_chapter+1)
|
||
comicInfo.setChapterName(chapter)
|
||
if not comicInfo.nextExistsGetPath("done_"):
|
||
cls.comicChapter(href,scramble=True,sleep=random.randint(5,15))
|
||
#存在就校验CBZ包是否完整
|
||
if comicInfo.nextExistsGetPath("done_"):
|
||
verUtils.verCBZ()
|
||
cls.count_chapter += 1
|
||
#一本漫画下载后等待
|
||
#清空文件夹
|
||
path_dir_comic = comicInfo.getDirComic()
|
||
if os.path.exists(path_dir_comic):
|
||
shutil.rmtree(path_dir_comic)
|
||
if sleep != None:
|
||
time.sleep(sleep)
|
||
|
||
'''
|
||
|
||
读取某章节下所有图片
|
||
'''
|
||
@classmethod
|
||
def comicChapter(cls,chapter_url,scramble=None,sleep=None):
|
||
is_next = True
|
||
#try:
|
||
is_next = cls.Onechapter(chapter_url,scramble)
|
||
#进入下个阶段
|
||
if comicInfo.nextExistsGetPath("down_"):
|
||
#章节图片全部下载后,调用下载封面
|
||
download_comic_icon()
|
||
#下个阶段
|
||
if comicInfo.nextExistsGetPath("cbz_"):
|
||
time.sleep(0.1)
|
||
#下载后自动打包
|
||
is_next = CBZUtils.packAutoComicChapterCBZ()
|
||
#完成删除原文件
|
||
remove_path = comicInfo.getDirComicChapter()
|
||
if os.path.exists(remove_path):
|
||
shutil.rmtree(remove_path)
|
||
print(f"文件已删除: {remove_path}")
|
||
#except Exception as e:
|
||
# print(e)
|
||
# ntfy.sendMsg(f"{comicInfo.getComicName()} 下载出错了")
|
||
# is_next = False
|
||
ntfy.sendMsg(f"预计总章节大小:{cls.count_chapter + 1} / "+ str(comicInfo.getLenChapters()))
|
||
comicInfo.setChapterIndex(cls.count_chapter + 1)
|
||
if sleep != None and is_next == True:
|
||
ntfy.sendMsg(f"{sleep} 秒后开始下载下一个章节")
|
||
time.sleep(sleep)
|
||
|
||
|
||
@classmethod
|
||
def Onechapter(cls,chapter_url,scramble=None):
|
||
if not str(chapter_url).startswith("http"):
|
||
chapter_url = comicInfo.getBaseUrl() + chapter_url
|
||
try:
|
||
is_next = cls.comicChapterDownload(chapter_url)
|
||
except:
|
||
htmlUtils.remove_HtmlCache(chapter_url)
|
||
is_next = cls.comicChapterDownload(chapter_url)
|
||
comicInfo.nextInfoToImgChapter()
|
||
#下载完成后, 开始解密图片
|
||
chapter_dir = comicInfo.getDirComicChapter()
|
||
if scramble and os.path.exists(chapter_dir):
|
||
#获取章节图片路径
|
||
dirs = os.listdir(chapter_dir)
|
||
for img in dirs:
|
||
if img.startswith("scramble="):
|
||
c_path = os.path.join(chapter_dir, img)
|
||
#imageUtils.getScrambleImage(c_path)
|
||
imageUtils.encode_scramble_image(c_path)
|
||
#进入下一阶段
|
||
comicInfo.nextImgToDownloadChapter()
|
||
return is_next
|
||
|
||
@classmethod
|
||
def comicChapterDownload(cls,url):
|
||
comicCommon.comicChapterDownload(url)
|
||
list_img = comicInfo.getChapterListImg()
|
||
files_name = comicInfo.getChapterFilesName()
|
||
#netUtils.downloadComicChapterImages(list_img,scrambles=list_scramble)
|
||
chapter_name = comicInfo.getChapter()
|
||
book_name = comicInfo.getComicName()
|
||
comicInfo.setChapterImgs(list_img)
|
||
#保存图像
|
||
comicInfo.nextSaveInfoChapter(chapter_name, list_img)
|
||
#验证数据是已存在且是否完整
|
||
#cbz_path = comicInfo.getDirCBZComicChapter()+".CBZ"
|
||
cbz_path = comicInfo.getNewCBZComicChapter()+".CBZ"
|
||
#更新Icon
|
||
comicInfo.getNewIconComicChapter()
|
||
is_next = True
|
||
if os.path.exists(cbz_path):
|
||
try:
|
||
cbz_size = len(CBZUtils.zip_info(cbz_path)) - 1
|
||
except:
|
||
cbz_size = 0
|
||
if len(list_img) == cbz_size:
|
||
ntfy.sendMsg(f"{book_name} {chapter_name} 数据完整,已跳过")
|
||
comicInfo.nextDoneSave(list_img)
|
||
is_next = False
|
||
else:
|
||
ntfy.sendMsg(f"{book_name} {chapter_name} 数据不完整,尝试删除配置CBZ文件后重试")
|
||
try:
|
||
if cbz_size < len(list_img) or os.path.getsize(cbz_path) < 300000:
|
||
ntfy.sendMsg(f"删除 {cbz_path}")
|
||
os.remove(cbz_path)
|
||
else:
|
||
is_next = False
|
||
except:
|
||
ntfy(f"删除失败 {cbz_path}")
|
||
if is_next:
|
||
path_comic_info = comicInfo.getPathComicInfoXML()
|
||
if not os.path.exists(path_comic_info):
|
||
#print("不存在ComicInfo.xml 生成中...")
|
||
comicInfo.setPages(files_name)
|
||
comicInfo.writeComicInfoXML(chapter_name)
|
||
ntfy.sendMsg(f"{book_name} {chapter_name} 下载中")
|
||
is_next = verUtils.verNextCBZ(list_img)
|
||
repeat = 0
|
||
while not is_next or repeat <= 3:
|
||
download_images(list_img,comicInfo.getDirComicChapter(), filesName=files_name,timeout=180)
|
||
file_imgs = os.listdir(comicInfo.getDirComicChapter())
|
||
count_jpg = ",".join(file_imgs).split(".jpg")
|
||
is_next = len(count_jpg)-1 == len(list_img)
|
||
if not is_next:
|
||
sleep_time = 3+int(repeat)*2
|
||
time.sleep(sleep_time)
|
||
ntfy.sendMsg(f"下载数据({len(count_jpg)-1}/{len(list_img)})不完整,{sleep_time}秒钟后尝试第{repeat}次")
|
||
repeat += 1
|
||
return is_next |