From 8dda8da2b385e6e52a2dfd927fd18491d5785049 Mon Sep 17 00:00:00 2001 From: jnozsc Date: Sun, 16 Feb 2020 14:45:40 -0800 Subject: [PATCH] fix fanza hinban issue --- fanza.py | 11 ++++++++--- 1 file changed, 8 insertions(+), 3 deletions(-) diff --git a/fanza.py b/fanza.py index 36e87ee..9457c27 100644 --- a/fanza.py +++ b/fanza.py @@ -83,6 +83,11 @@ def main(number): htmlcode=get_html('https://www.dmm.co.jp/mono/dvd/-/detail/=/cid='+number) url = 'https://www.dmm.co.jp/mono/dvd/-/detail/=/cid='+number try: + # for some old page, the input number does not match the page + # for example, the url will be cid=test012 + # but the hinban on the page is test00012 + # so get the hinban first, and then pass it to following functions + number = getNum(htmlcode) dic = { 'title': getTitle(htmlcode).strip(getActor(htmlcode)), 'studio': getStudio(htmlcode), @@ -91,15 +96,15 @@ def main(number): 'director': getDirector(htmlcode), 'actor': getActor(htmlcode), 'release': getRelease(htmlcode), - 'number': getNum(htmlcode), - 'cover': getCover(htmlcode,number), + 'number': number, + 'cover': getCover(htmlcode, number), 'imagecut': 1, 'tag': getTag(htmlcode), 'label':getLabel(htmlcode), 'year': getYear(getRelease(htmlcode)), # str(re.search('\d{4}',getRelease(a)).group()), 'actor_photo': '', 'website': url, - 'source': 'siro.py', + 'source': 'fanza.py', } except : dic = {