146 lines
5.2 KiB
Python
146 lines
5.2 KiB
Python
#!/usr/bin/env python
|
||
# -*- coding: utf- -*-
|
||
|
||
import argparse
|
||
from webdav3.client import Client
|
||
import os
|
||
import time
|
||
import re
|
||
import sys
|
||
import traceback
|
||
|
||
count=0
|
||
failcount=0
|
||
|
||
fullscan=True
|
||
|
||
def walk(client, current_path="/", output_file=None, replaceroot=None, lastpath=None):
|
||
global failcount
|
||
try:
|
||
items=client.list(current_path)
|
||
failcount=0
|
||
except KeyboardInterrupt:
|
||
print("get ctrl+c, exit")
|
||
sys.exit(1)
|
||
except:
|
||
traceback.print_exc()
|
||
time.sleep(1)
|
||
failcount+=1
|
||
if failcount>10:
|
||
sys.exit(1)
|
||
return
|
||
filetype_re=re.compile(r'\.(png|jpg|jpeg|bmp|gif|doc|nfo|flac|mp3|wma|ape|cue|wav|dst|dff|dts|ac3|eac3|txt|db|pdf)$')
|
||
# print(items)
|
||
for item in items[1:]:
|
||
full_path = f"{current_path}/{item}".replace("//", "/")
|
||
try:
|
||
# is_dir = client.is_dir(full_path)
|
||
is_dir = full_path.endswith("/")
|
||
except:
|
||
continue
|
||
global fullscan
|
||
# print(f"fullscan:{fullscan}, full_path:{full_path}, lastpath:{lastpath}")
|
||
if is_dir: # 判断是否为目录
|
||
#global count
|
||
#count=count+1
|
||
#if count%4==0:
|
||
# time.sleep(1)
|
||
if not fullscan and not full_path in lastpath:
|
||
continue
|
||
if full_path == lastpath:
|
||
fullscan = True
|
||
try:
|
||
walk(client, full_path, output_file, replaceroot, lastpath)
|
||
except KeyboardInterrupt:
|
||
print("get ctrl+c, exit")
|
||
sys.exit(1)
|
||
except:
|
||
time.sleep(1)
|
||
#sys.exit(1)
|
||
pass
|
||
elif not fullscan:
|
||
continue
|
||
else:
|
||
if filetype_re.search(full_path) != None or "BDMV" in full_path:
|
||
continue
|
||
size = int(client.info(full_path).get('size', 0))
|
||
if size>0 and size<4096:
|
||
continue
|
||
if replaceroot!=None:
|
||
if replaceroot=="":
|
||
# full_path=os.path.join("/",*full_path.split("/")[2:])
|
||
full_path = "/"+"/".join(full_path.split("/")[2:])
|
||
else:
|
||
# full_path=os.path.join("/",replaceroot,*full_path.split("/")[2:])
|
||
full_path = "/"+replaceroot+"/"+"/".join(full_path.split("/")[2:])
|
||
full_path = full_path.replace("//","/")
|
||
full_path = full_path.replace("\\/","|")
|
||
print(f"{full_path}\t{size}")
|
||
if output_file != None:
|
||
output_file.write(f"{full_path}\t{size}\n")
|
||
output_file.flush()
|
||
|
||
|
||
from urllib.parse import urlparse
|
||
|
||
def extract_url_components(url):
|
||
"""分解 URL 为 schema(协议)、hostname(主机地址)、path(路径)"""
|
||
parsed = urlparse(url)
|
||
|
||
# 提取核心组件
|
||
schema = parsed.scheme or "http" # 默认协议处理
|
||
hostname = f"{parsed.hostname}:{parsed.port}" # 自动过滤端口和认证信息
|
||
path = parsed.path.rstrip('/') or '/' # 路径标准化
|
||
|
||
return schema, hostname, path
|
||
|
||
|
||
def main():
|
||
parser = argparse.ArgumentParser(description='快速遍历WebDAV目录')
|
||
parser.add_argument('--url', type=str, required=True, help='WebDAV URL')
|
||
parser.add_argument('--username', type=str, required=True, help='WebDAV username')
|
||
parser.add_argument('--password', type=str, required=True, help='WebDAV password')
|
||
parser.add_argument('--output', type=str, required=True, help='输出文件')
|
||
parser.add_argument('--lastpath', type=str, default=None, required=False, help='最后扫到的路径(从此开始继续)')
|
||
parser.add_argument('--replaceroot', type=str, default=None, required=False, help='替换根目录名称')
|
||
args = parser.parse_args()
|
||
|
||
schema, hostname, path = extract_url_components(args.url)
|
||
print(schema,hostname,path)
|
||
|
||
options = {
|
||
'webdav_hostname': schema+"://"+hostname,
|
||
'webdav_root': '/',
|
||
'webdav_login': args.username,
|
||
'webdav_password': args.password,
|
||
'disable_check': True, # 跳过 SSL 证书验证:ml-citation{ref="6" data="citationList"}
|
||
'disable_head': True, # 跳过 SSL 证书验证:ml-citation{ref="6" data="citationList"}
|
||
}
|
||
client = Client(options)
|
||
|
||
print("WebDAV URL:", args.url)
|
||
if args.lastpath == None:
|
||
try:
|
||
with open(args.output, "r", encoding="utf-8") as f:
|
||
tmplines = f.readlines()
|
||
for i in range(len(tmplines)-1, -1, -1):
|
||
line=tmplines[i].strip()
|
||
if line != None and line != "":
|
||
args.lastpath = os.path.dirname(line.split("\t")[0])
|
||
break
|
||
except:
|
||
traceback.print_exc()
|
||
output_file = open(args.output, mode="a", encoding="utf-8")
|
||
if args.lastpath != None and args.lastpath != "":
|
||
global fullscan
|
||
fullscan = False
|
||
if args.lastpath != None:
|
||
if not args.lastpath.endswith("/"):
|
||
args.lastpath = args.lastpath+"/"
|
||
print(f"lastpath:{args.lastpath}")
|
||
walk(client, path, output_file,args.replaceroot, args.lastpath)
|
||
output_file.close()
|
||
|
||
if __name__ == '__main__':
|
||
main()
|