forked from nonomal/AVDC
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathAV_Data_Capture.py
executable file
·76 lines (71 loc) · 3.47 KB
/
AV_Data_Capture.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
import os
from core import *
def movie_lists(escape_folder):
    """Collect the video files found under the current working directory.

    Args:
        escape_folder: Comma-separated folder names to skip. Both the ASCII
            comma and the full-width comma are accepted as separators. A
            directory is skipped when any of the names occurs as a substring
            of its path. Pass ``''`` to skip nothing.

    Returns:
        A list of file paths relative to the working directory. Every path
        starts with ``./`` and uses ``/`` as the separator.
    """
    # Blank entries must be dropped: an empty name is a substring of every
    # path, so a stray trailing comma would otherwise exclude the whole tree.
    skip_names = []
    if escape_folder:
        skip_names = [
            name.strip()
            for name in re.split('[,\uff0c]', escape_folder)
            if name.strip()
        ]

    # Compared against the lower-cased extension, so mixed case also matches.
    video_suffixes = {'.mp4', '.avi', '.rmvb', '.wmv', '.mov', '.mkv', '.flv', '.ts'}

    file_root = os.getcwd()
    total = []
    for root, dirs, files in os.walk(file_root):
        if any(name in root for name in skip_names):
            # Every descendant path contains this one and would be skipped as
            # well, so stop os.walk from descending into it at all.
            dirs[:] = []
            continue
        for f in files:
            if os.path.splitext(f)[1].lower() not in video_suffixes:
                continue
            # relpath removes only the leading working-directory prefix; a
            # plain str.replace would also rewrite later occurrences of it.
            relative = os.path.relpath(os.path.join(root, f), file_root)
            total.append('./' + relative.replace('\\', '/'))
    return total
# Ordered ID patterns tried on names containing '-' or '_'; the first hit wins.
_NUMBER_PATTERNS = (
    r'\w+-\d+',    # e.g. mkbd-120
    r'\w+-\w\d+',  # e.g. mkbd-s120
    r'\d+-\w+',    # e.g. 111111-MMMM
    r'\d+-\d+',    # e.g. 111111-000
    r'\d+_\d+',    # e.g. 111111_000
)


def getNumber(filepath):
    """Extract the movie ID ("number") from a video file path.

    Args:
        filepath: Path of the video file, using ``/`` as the separator.

    Returns:
        The ID parsed from the file name. When no digit run or no non-digit
        run can be found in a name without ``-``/``_``, the file name without
        its extension is returned instead.
    """
    # Drop the "-C" / "-c" suffix that sits right before the extension.
    filepath = filepath.replace('-C.', '.').replace('-c.', '.')
    basename = os.path.splitext(filepath.split('/')[-1])[0]
    filename = basename

    # Remove a multi-part marker such as "-CD1"; if both spellings occur,
    # the lower-case one is the one removed.
    part = ''
    for marker in (r'-CD\d+', r'-cd\d+'):
        found = re.search(marker, filename)
        if found:
            part = found.group()
    if part:
        filename = filename.replace(part, '')

    # Remove dates embedded in the file name (trailing, then leading form).
    filename = re.sub(r'-\d{4}-\d{1,2}-\d{1,2}', '', filename)
    filename = re.sub(r'\d{4}-\d{1,2}-\d{1,2}-', '', filename)

    # Western-style IDs such as sexart.11.11.11. The dots are escaped so that
    # only literal dots separate the groups; an unescaped '.' would also
    # swallow digits and dashes of long ordinary IDs and truncate them.
    western = re.search(r'^\D+\.\d{2}\.\d{2}\.\d{2}', filename)
    if western:
        return western.group()

    # Regular IDs that contain '-' or '_'.
    if '-' in filename or '_' in filename:
        # Only FC2 names carry a PPV token that has to be removed.
        if 'fc2' in filename.lower():
            for token in ('-PPV', 'PPV-', '-ppv', 'ppv-'):
                filename = filename.replace(token, '')
        for pattern in _NUMBER_PATTERNS:
            found = re.search(pattern, filename)
            if found:
                return found.group()
        return filename

    # IDs without a dash: keep FANZA CIDs such as ssni00644 unchanged, and
    # turn short ones such as MIDE139 into MIDE-139.
    file_number = os.path.splitext(filename)[0]
    digits = re.search(r'\d+', file_number)
    letters = re.search(r'\D+', file_number)
    if digits is None or letters is None:
        return basename
    if len(digits.group()) <= 4 and len(letters.group()) > 1:
        return letters.group() + '-' + digits.group()
    return file_number