# Reviewer preamble (patch tools skip everything before the first "diff --git" header).
#
# What this patch does:
#   * AV_Data_Capture.py: launches each file through 'core.exe' instead of
#     'python core.py' (the two os.system lines swap which one is commented out).
#   * core.py, getNumberFromFilename: both FC2 branches now chain .strip() calls
#     for the lower-case and upper-case prefixes.
#   * core.py, creatFolder: declares `global actor`; if os.makedirs(path) raises,
#     retries with `actor` replaced by "'其他'" inside location_rule.
#   * siro.py, getTitle: wraps the XPath lookup in try/except and returns ''
#     on any failure; the commented-out sample id at the end of the file changes.
#
# Review notes on the added lines (not changed here, so the patch content stays as authored):
#   * str.strip(chars) removes any leading/trailing characters found in `chars`;
#     it does not remove a literal prefix. A number that starts or ends with
#     '2' (or with any other character from the sets) gets truncated.
#   * The new `except:` clauses are bare, so they also catch KeyboardInterrupt
#     and SystemExit; `except Exception:` (or OSError for makedirs) is safer.
#   * os.system() builds a shell command by concatenating the file name; a name
#     containing a double quote breaks out of the quoting.
#   * NOTE(review): only part of creatFolder is visible; in the visible lines
#     `actor` is only read, which does not require a `global` declaration.
#
# NOTE(review): the line breaks and leading indentation below were reconstructed
# from hunk line counts and Python block structure; inner whitespace is kept as
# found. Verify indentation against the target files before applying.
diff --git a/AV_Data_Capture.py b/AV_Data_Capture.py
index 98de9c6..35315a0 100644
--- a/AV_Data_Capture.py
+++ b/AV_Data_Capture.py
@@ -71,8 +71,8 @@ if __name__ =='__main__':
         if '_' in i:
             os.rename(re.search(r'[^\\/:*?"<>|\r\n]+$', i).group(), rreplace(re.search(r'[^\\/:*?"<>|\r\n]+$', i).group(), '_', '-', 1))
             i = rreplace(re.search(r'[^\\/:*?"<>|\r\n]+$', i).group(), '_', '-', 1)
-        os.system('python core.py' + ' "' + i + '"') #选择从py文件启动 (用于源码py)
-        #os.system('core.exe' + ' "' + i + '"') #选择从exe文件启动(用于EXE版程序)
+        #os.system('python core.py' + ' "' + i + '"') #选择从py文件启动 (用于源码py)
+        os.system('core.exe' + ' "' + i + '"') #选择从exe文件启动(用于EXE版程序)
         print("[*]=====================================")
 
     print("[!]Cleaning empty folders")
diff --git a/core.py b/core.py
index 9801d9d..c187076 100644
--- a/core.py
+++ b/core.py
@@ -108,9 +108,9 @@ def getNumberFromFilename(filepath):
     except: #添加 无需 正则表达式的规则
         # ====================fc2fans_club.py===================
         if 'fc2' in filename:
-            json_data = json.loads(fc2fans_club.main(file_number.strip('fc2_').strip('fc2-').strip('ppv-').strip('PPV-')))
+            json_data = json.loads(fc2fans_club.main(file_number.strip('fc2_').strip('fc2-').strip('ppv-').strip('PPV-').strip('FC2_').strip('FC2-').strip('ppv-').strip('PPV-')))
         elif 'FC2' in filename:
-            json_data = json.loads(fc2fans_club.main(file_number.strip('FC2_').strip('FC2-').strip('ppv-').strip('PPV-')))
+            json_data = json.loads(fc2fans_club.main(file_number.strip('FC2_').strip('FC2-').strip('ppv-').strip('PPV-').strip('fc2_').strip('fc2-').strip('ppv-').strip('PPV-')))
             #print(file_number.strip('FC2_').strip('FC2-').strip('ppv-').strip('PPV-'))
         #=======================javbus.py=======================
         else:
@@ -156,6 +156,7 @@ def getNumberFromFilename(filepath):
         os._exit(0)
 path = '' #设置path为全局变量,后面移动文件要用
 def creatFolder():
+    global actor
     global path
     if len(actor) > 240: #新建成功输出文件夹
         path = location_rule.replace("'actor'","'超多人'",3).replace("actor","'超多人'",3) #path为影片+元数据所在目录
@@ -164,7 +165,13 @@ def creatFolder():
         path = location_rule
         #print(path)
     if not os.path.exists(path):
-        os.makedirs(path)
+        try:
+            os.makedirs(path)
+        except:
+            path = location_rule.replace(actor,"'其他'")
+            os.makedirs(path)
+
+
 #=====================资源下载部分===========================
 def DownloadFileWithFilename(url,filename,path): #path = examle:photo , video.in the Project Folder!
     config = ConfigParser()
diff --git a/siro.py b/siro.py
index 3692bdd..ed8c84d 100644
--- a/siro.py
+++ b/siro.py
@@ -6,9 +6,12 @@ from bs4 import BeautifulSoup
 from ADC_function import *
 
 def getTitle(a):
-    html = etree.fromstring(a, etree.HTMLParser())
-    result = str(html.xpath('//*[@id="center_column"]/div[2]/h1/text()')).strip(" ['']")
-    return result.replace('/',',')
+    try:
+        html = etree.fromstring(a, etree.HTMLParser())
+        result = str(html.xpath('//*[@id="center_column"]/div[2]/h1/text()')).strip(" ['']")
+        return result.replace('/', ',')
+    except:
+        return ''
 def getActor(a): #//*[@id="center_column"]/div[2]/div[1]/div/table/tbody/tr[1]/td/text()
     html = etree.fromstring(a, etree.HTMLParser()) #//table/tr[1]/td[1]/text()
     result1=str(html.xpath('//th[contains(text(),"出演:")]/../td/a/text()')).strip(" ['']").strip('\\n ').strip('\\n')
@@ -96,4 +99,4 @@ def main(number2):
     js = json.dumps(dic, ensure_ascii=False, sort_keys=True, indent=4, separators=(',', ':'),)#.encode('UTF-8')
     return js
 
-#print(main('200GANA-1624'))
\ No newline at end of file
+#print(main('200GANA-1581'))
\ No newline at end of file