You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
463 lines
18 KiB
463 lines
18 KiB
import yaml |
|
import oss2 |
|
from tqdm import tqdm |
|
import os |
|
import numpy as np |
|
import os |
|
import argparse |
|
# import bpy |
|
import sys |
|
import open3d as o3d |
|
|
|
from pathlib import Path |
|
|
|
import requests |
|
import json |
|
import shutil |
|
|
|
from config import url_get_oss_suffix_by_orderId |
|
|
|
from general import transform_save_bpy |
|
from general import read_models_from_json |
|
|
|
from compute_print_net import get_oss_client |
|
|
|
def download_transform_save_by_json(json_name, workdir, oss_config):
    """Download every model listed in a batch JSON, then hand the layout to ``transform_save_bpy``.

    Args:
        json_name: Batch JSON file name without the ``.json`` extension.
        workdir: Directory holding the JSON file; also passed to
            ``transform_save_bpy`` as the directory of the downloaded objects.
        oss_config: Forwarded unchanged to ``download_datas_by_json``.
    """
    transform_save_bpy(
        download_datas_by_json(json_name, workdir, oss_config),
        workdir,
    )
|
|
|
class DataTransfer:
    """Transfer files between a local path and a path inside an OSS bucket.

    The download methods list every object under ``oss_path`` (used as a key
    prefix) and mirror it below ``local_path``. The "rename" variants
    additionally rename the downloaded files and patch the file references
    inside ``.obj`` / ``.mtl`` files so they match the new names.
    """

    # Extensions whose local copy is stored as "<order_id>_<original name>".
    _PREFIXED_EXTS = ('.mtl', '.jpg', '.jpeg', '.png')

    # NOTE(review): bare annotations with no value assigned; nothing in this
    # class reads them. Presumably leftovers from a model-info record - confirm
    # before removing.
    order_id: str
    pid: str
    model_height: str

    def __init__(self, local_path: str, oss_path: str, oss_client: "oss2.Bucket"):
        """Store the transfer endpoints.

        Args:
            local_path: Local output path (file or directory, depending on
                the method called afterwards).
            oss_path: OSS path; leading ``/`` characters are stripped.
            oss_client: OSS bucket client used for every transfer.
        """
        self.local_path = local_path
        self.oss_path = oss_path.lstrip('/')
        self.oss_client = oss_client

    # ------------------------------------------------------------------
    # Shared private helpers
    # ------------------------------------------------------------------
    @staticmethod
    def _ensure_parent_dir(path):
        """Create the parent directory of ``path`` if it has one."""
        parent = os.path.dirname(path)
        # os.makedirs('') raises, so a bare file name must be skipped.
        if parent:
            os.makedirs(parent, exist_ok=True)

    @staticmethod
    def _prefix_reference(line, directive, order_id):
        """Return ``line`` rewritten with an order-id prefixed file name.

        Returns ``None`` when ``line`` is not a ``directive <file>`` statement.
        The statement is parsed from the stripped line so indented statements
        are handled, and only the file-name part of the reference is prefixed
        because the download renames file names, not directories.
        """
        parts = line.strip().split(None, 1)
        if len(parts) != 2 or parts[0] != directive:
            return None
        reference = parts[1].strip()
        cut = max(reference.rfind('/'), reference.rfind('\\')) + 1
        return f"{directive} {reference[:cut]}{order_id}_{reference[cut:]}"

    @classmethod
    def _prefix_obj_mtllib(cls, local_path, order_id):
        """Rewrite the first ``mtllib`` statement of an ``.obj`` file in place.

        The file is streamed through a sibling ``.tmp`` file, which replaces
        the original on success and is removed on failure.

        Returns:
            True when the file was rewritten, False when reading or writing
            failed (the error is printed and the original file is kept).
        """
        temp_path = local_path + '.tmp'
        try:
            with open(local_path, 'r', encoding='utf-8') as f_in, \
                    open(temp_path, 'w', encoding='utf-8') as f_out:
                rewritten = False
                for line in f_in:
                    if not rewritten:
                        new_line = cls._prefix_reference(line, 'mtllib', order_id)
                        if new_line is not None:
                            f_out.write(new_line + "\n")
                            rewritten = True
                            continue
                    f_out.write(line)
            os.replace(temp_path, local_path)
            return True
        except IOError as e:
            print(f"处理大文件 {local_path} 时出错: {e}")
        except UnicodeDecodeError as e:
            print(f"文件编码错误 {local_path}: {e}")
        # Only reached on failure: do not leave the partial temp file behind.
        if os.path.exists(temp_path):
            os.remove(temp_path)
        return False

    @classmethod
    def _prefix_mtl_map_kd(cls, local_path, order_id):
        """Rewrite the first ``map_Kd`` statement of an ``.mtl`` file in place.

        NOTE(review): only the first ``map_Kd`` is rewritten, although every
        downloaded image is renamed; later ``map_Kd`` statements and other
        texture statements keep their old names - confirm this is intended.

        Returns:
            True when the file was written back, False on a read/write or
            decoding error (the error is printed).
        """
        try:
            with open(local_path, 'r', encoding='utf-8') as f:
                lines = f.read().split('\n')
            for index, line in enumerate(lines):
                new_line = cls._prefix_reference(line, 'map_Kd', order_id)
                if new_line is not None:
                    lines[index] = new_line
                    break
            with open(local_path, 'w', encoding='utf-8') as f:
                f.write('\n'.join(lines))
            return True
        except IOError as e:
            print(f"处理文件 {local_path} 时出错: {e}")
        except UnicodeDecodeError as e:
            print(f"文件编码错误 {local_path}: {e}")
        return False

    def _list_keys(self):
        """List the object keys under the OSS prefix.

        Returns:
            ``(prefix, found_any, keys)`` where ``found_any`` tells whether
            the listing returned anything at all and ``keys`` excludes the
            key equal to the prefix itself.
        """
        prefix = self.oss_path.lstrip('/')
        found_any = False
        keys = []
        for obj in oss2.ObjectIterator(self.oss_client, prefix=prefix):
            found_any = True
            if obj.key != prefix:
                keys.append(obj.key)
        return prefix, found_any, keys

    @staticmethod
    def _iter_downloadable(keys, prefix):
        """Yield ``(key, relative_path)`` for every key that is downloaded.

        Keys ending in ``/`` and keys containing ``printId`` are skipped.
        """
        for key in tqdm(keys, desc="下载进度"):
            if key.endswith('/') or "printId" in key:
                continue
            yield key, key[len(prefix):].lstrip('/')

    def _renamed_file_name(self, file_name, model_info, obj_name_for):
        """Return the local file name to use for ``file_name``.

        ``obj_name_for`` receives the original extension and is only called
        for ``.obj`` files; ``model_info.order_id`` is only read for files
        whose extension is in ``_PREFIXED_EXTS``.
        """
        ext = os.path.splitext(file_name)[1]
        kind = ext.lower()
        if kind in self._PREFIXED_EXTS:
            return f"{model_info.order_id}_{file_name}"
        if kind == '.obj':
            return obj_name_for(ext)
        return file_name

    def _fetch_and_fix(self, obj_key, source_name, new_rel_path, model_info):
        """Download ``obj_key`` to ``new_rel_path`` and patch its references.

        ``source_name`` is the original file name; its extension (compared
        case-insensitively) decides whether the ``.obj`` or ``.mtl`` reference
        rewrite is applied after the download.
        """
        local_path = os.path.join(self.local_path, new_rel_path)
        self._ensure_parent_dir(local_path)
        self.oss_client.get_object_to_file(obj_key, local_path)

        kind = os.path.splitext(source_name)[1].lower()
        if kind == '.obj':
            self._prefix_obj_mtllib(local_path, model_info.order_id)
        elif kind == '.mtl':
            self._prefix_mtl_map_kd(local_path, model_info.order_id)

        print(f"下载文件: {obj_key} -> {local_path}")

    # ------------------------------------------------------------------
    # Public API
    # ------------------------------------------------------------------
    def download_data(self):
        """Download everything under the OSS prefix, keeping the directory layout."""
        prefix, _, keys = self._list_keys()
        for obj_key, rel_path in self._iter_downloadable(keys, prefix):
            local_path = os.path.join(self.local_path, rel_path)
            self._ensure_parent_dir(local_path)
            self.oss_client.get_object_to_file(obj_key, local_path)
            print("download_data local_path=" + local_path)

    def download_data_rename_json(self, json_model_info):
        """Download everything under the OSS prefix, renaming files per ``json_model_info``.

        ``.mtl`` and image files get an ``<order_id>_`` prefix, ``.obj`` files
        are stored as ``json_model_info.obj_name``, other files keep their
        name. The first ``mtllib`` / ``map_Kd`` reference of each ``.obj`` /
        ``.mtl`` file is rewritten to carry the same prefix.

        Args:
            json_model_info: Object providing ``order_id`` and ``obj_name``.
        """
        prefix, _, keys = self._list_keys()
        for obj_key, rel_path in self._iter_downloadable(keys, prefix):
            file_dir, file_name = os.path.split(rel_path)
            new_file_name = self._renamed_file_name(
                file_name,
                json_model_info,
                lambda _ext: f"{json_model_info.obj_name}",
            )
            print("new_file_name=", new_file_name)
            self._fetch_and_fix(
                obj_key,
                file_name,
                os.path.join(file_dir, new_file_name),
                json_model_info,
            )

    def download_data_rename_batch(self, batch_model_info):
        """Download everything under the OSS prefix, renaming files per ``batch_model_info``.

        Same renaming as ``download_data_rename_json`` except that ``.obj``
        files are stored as
        ``<order_id>_<pid>_P<print_order_id>_<model_size><ext>``.

        Args:
            batch_model_info: Object providing ``order_id``, ``pid``,
                ``print_order_id`` and ``model_size``.

        Returns:
            False when the listing under the prefix is empty, True otherwise.
        """
        prefix, found_any, keys = self._list_keys()
        if not found_any:
            print(f"前缀 '{prefix}' 下没有找到任何文件或目录。")
            return False
        print(f"前缀 '{prefix}' 存在,共找到 {len(keys)} 个对象。")

        def obj_name_for(ext):
            info = batch_model_info
            return f"{info.order_id}_{info.pid}_P{info.print_order_id}_{info.model_size}{ext}"

        for obj_key, rel_path in self._iter_downloadable(keys, prefix):
            file_dir, file_name = os.path.split(rel_path)
            new_file_name = self._renamed_file_name(file_name, batch_model_info, obj_name_for)
            self._fetch_and_fix(
                obj_key,
                file_name,
                os.path.join(file_dir, new_file_name),
                batch_model_info,
            )

        return True

    def download_single_file(self):
        """Download the single object ``oss_path`` to the file ``local_path``.

        A missing OSS key is reported with a message instead of raising.
        """
        self._ensure_parent_dir(self.local_path)
        try:
            self.oss_client.get_object_to_file(self.oss_path, self.local_path)
            print(f"文件已下载到: {self.local_path}")
        except oss2.exceptions.NoSuchKey:
            print(f"OSS文件不存在: {self.oss_path}")

    def upload_data(self):
        """Upload ``local_path`` (a file or a directory tree) to OSS.

        For a file: when ``oss_path`` has a suffix that differs from the local
        file's suffix, the file is uploaded under its own name into the
        directory part of ``oss_path``; otherwise it is uploaded to
        ``oss_path`` itself. For a directory: every file is uploaded below
        ``oss_path`` keeping its relative path.

        Raises:
            FileNotFoundError: ``local_path`` does not exist.
            ValueError: a directory is uploaded to an ``oss_path`` that has a
                suffix, or ``local_path`` is neither a file nor a directory.
        """
        if not os.path.exists(self.local_path):
            raise FileNotFoundError(f"本地路径不存在: {self.local_path}")

        if os.path.isfile(self.local_path):
            local_suffix = Path(self.local_path).suffix
            oss_suffix = Path(self.oss_path).suffix

            if oss_suffix and oss_suffix != local_suffix:
                oss_dir = os.path.dirname(self.oss_path)
                # OSS keys always use '/', also when running on Windows.
                oss_target_path = os.path.join(
                    oss_dir, os.path.basename(self.local_path)
                ).replace("\\", "/")
            else:
                oss_target_path = self.oss_path

            self.oss_client.put_object_from_file(oss_target_path, self.local_path)
            print(f"文件已上传到: {oss_target_path}")

        elif os.path.isdir(self.local_path):
            if Path(self.oss_path).suffix:
                raise ValueError("不能将目录上传到具有后缀名的OSS路径。")

            for root, _dirs, files in os.walk(self.local_path):
                for file in files:
                    local_file_path = os.path.join(root, file)
                    relative_path = os.path.relpath(local_file_path, self.local_path)
                    oss_file_path = os.path.join(self.oss_path, relative_path).replace("\\", "/")

                    self.oss_client.put_object_from_file(oss_file_path, local_file_path)
                    print(f"文件已上传到: {oss_file_path}")
        else:
            raise ValueError(f"无效的本地路径类型: {self.local_path}")
|
|
|
def get_api(url, timeout=30):
    """GET ``url`` and return the decoded JSON body.

    Args:
        url: Address to request.
        timeout: Seconds to wait for the server before giving up; without a
            timeout ``requests`` may block indefinitely.

    Returns:
        The decoded JSON object when its ``"code"`` field equals 1000.

    Raises:
        Exception: the request failed, the HTTP status signals an error, or
            the body's ``"code"`` is not 1000.
    """
    try:
        response = requests.get(url, timeout=timeout)
        response.raise_for_status()  # turn HTTP error statuses into exceptions
        payload = json.loads(response.text)
        if payload.get("code") != 1000:
            raise Exception(f"Error fetching URL {url}: {payload.get('message')}")
        return payload
    except requests.exceptions.RequestException as e:
        # Chain the cause so the original traceback is not lost.
        raise Exception(f"Error fetching URL {url}: {e}") from e
|
|
|
def download_data_by_json(model_info, workdir, oss_client):
    """Download the files of one model into ``workdir``.

    The OSS sub-path is fetched from ``url_get_oss_suffix_by_orderId`` for
    ``model_info.order_id`` (with ``"/init_obj"`` removed from the returned
    ``"data"`` value), then everything under
    ``objs/download/print/<pid>/<data>/<model_height>/`` is downloaded and
    renamed via ``DataTransfer.download_data_rename_json``.

    Failures are printed and swallowed so that a batch can continue with the
    next model.

    Args:
        model_info: Object providing ``pid``, ``model_height`` and ``order_id``
            (plus whatever ``download_data_rename_json`` reads).
        workdir: Local target directory.
        oss_client: OSS bucket client handed to ``DataTransfer``.
    """
    # Bound before the try so the error message below can always be built,
    # even when reading model_info.pid is what failed.
    pid = "<unknown>"
    try:
        pid = model_info.pid
        model_height = model_info.model_height
        target_dir = f"{workdir}"

        url = f"{url_get_oss_suffix_by_orderId}{model_info.order_id}"
        res = requests.get(url, timeout=30)
        res.raise_for_status()  # fail with the HTTP error, not a JSON/key error

        data = res.json()["data"]
        data = data.replace("/init_obj", "")

        print("target_dir=", target_dir)
        download_textures = DataTransfer(
            target_dir,
            f"objs/download/print/{pid}/{data}/{model_height}/",
            oss_client,
        )
        download_textures.download_data_rename_json(model_info)

        # Remove the target directory again if the download left it empty.
        if os.path.exists(target_dir) and not os.listdir(target_dir):
            shutil.rmtree(target_dir)
            print(f"下载后检查发现目标文件夹为空,已删除: {target_dir}")
    except Exception as e:
        # Deliberately best-effort: report and let the caller move on.
        print(f"下载失败: {pid}, 错误: {str(e)}")
|
|
|
def download_datas_by_json(pid_file, workdir, oss_config):
    """Download every model listed in ``<workdir>/<pid_file>.json``.

    Args:
        pid_file: JSON file name without the ``.json`` extension.
        workdir: Directory containing the JSON file; downloads go here too.
        oss_config: Passed to ``get_oss_client`` to build the OSS client.

    Returns:
        The second value returned by ``read_models_from_json`` for the file.
    """
    oss_client = get_oss_client(oss_config)
    json_path = os.path.join(workdir, f"{pid_file}.json")

    list_model_info, json_data = read_models_from_json(json_path)
    print(f"从文件读取了 {len(list_model_info)} 个PID")

    for model_info in list_model_info:
        print(f"开始下载PID: {model_info}")
        # Use the workdir argument, not the script-level `args`, so the
        # function also works when this module is imported.
        download_data_by_json(model_info, workdir, oss_client)

    return json_data
|
|
|
if __name__ == "__main__":
    # Only the arguments after a literal "--" belong to this script (see the
    # blender command line in the usage comment below); without a "--" the
    # argument list is empty.
    if "--" in sys.argv:
        script_args = sys.argv[sys.argv.index("--") + 1:]
    else:
        script_args = []

    parser = argparse.ArgumentParser()
    for flag, help_text in (
        ("--pid_file", "批次号, 也是json文件名"),
        ("--workdir", "json文件所在的目录"),
        ("--oss_config", "run.yaml所在的目录"),
    ):
        parser.add_argument(flag, type=str, required=True, help=help_text)
    args = parser.parse_args(script_args)

    download_transform_save_by_json(args.pid_file, args.workdir, args.oss_config)
|
|
|
# blender --background --python download_print_out.py -- --pid_file {your_batch_id} --workdir {your_batch_dir} --oss_config {your_yaml_dir/run.yaml} |
|
|