"""
CAD模型处理脚本
功能：将STEP格式的CAD模型转换为结构化数据，包括：
- 几何信息：面、边、顶点的坐标数据
- 拓扑信息：面-边-顶点的邻接关系
- 空间信息：包围盒数据
"""

import os
import pickle  # 用于数据序列化
import argparse  # 命令行参数解析
import numpy as np
from tqdm import tqdm  # 进度条显示
from concurrent.futures import ProcessPoolExecutor, as_completed, TimeoutError  # 并行处理
import logging
from datetime import datetime

# Module-level logging setup. Everything below runs at import time.

# Create the 'logs' directory (relative to the current working directory).
os.makedirs('logs', exist_ok=True)

# Module logger; INFO and above are recorded.
logger = logging.getLogger(__name__)
logger.setLevel(logging.INFO)

# Record format: timestamp - level - message.
formatter = logging.Formatter('%(asctime)s - %(levelname)s - %(message)s')

# File handler writing to a log file whose name carries the start timestamp.
current_time = datetime.now().strftime('%Y%m%d_%H%M%S')
log_file = f'logs/process_brep_{current_time}.log'
file_handler = logging.FileHandler(log_file, encoding='utf-8')
file_handler.setLevel(logging.INFO)
file_handler.setFormatter(formatter)

# Attach the file handler to the module logger.
logger.addHandler(file_handler)

# Write a start-of-run banner to the log.
logger.info("="*50)
logger.info("Script started")
logger.info(f"Log file: {log_file}")
logger.info("="*50)

# 导入OpenCASCADE相关库
from OCC.Core.STEPControl import STEPControl_Reader  # STEP文件读取器
from OCC.Core.TopExp import TopExp_Explorer, topexp  # 拓扑结构遍历
from OCC.Core.TopAbs import TopAbs_FACE, TopAbs_EDGE, TopAbs_VERTEX  # 拓扑类型定义
from OCC.Core.BRep import BRep_Tool  # B-rep工具
from OCC.Core.BRepMesh import BRepMesh_IncrementalMesh  # 网格剖分
from OCC.Core.TopLoc import TopLoc_Location  # 位置变换
from OCC.Core.IFSelect import IFSelect_RetDone  # 操作状态码
from OCC.Core.TopTools import TopTools_IndexedDataMapOfShapeListOfShape  # 形状映射
from OCC.Core.BRepBndLib import brepbndlib  # 包围盒计算
from OCC.Core.Bnd import Bnd_Box  # 包围盒
from OCC.Core.TopoDS import TopoDS_Shape, topods, TopoDS_Vertex  # 拓扑数据结构

# Maximum face-count threshold, intended to speed up processing.
# NOTE(review): not referenced anywhere in the visible part of this file.
MAX_FACE = 70

def normalize(surfs, edges, corners):
    """
    Centre and uniformly scale a CAD model using the extent of its corners.

    The centre is the midpoint of the axis-aligned box spanned by ``corners``
    and the scale is the reciprocal of that box's longest side, so the corners
    end up inside [-0.5, 0.5] on every axis.  Face and edge samples are
    transformed with the same centre/scale; geometry that extends beyond the
    corners is not clamped.

    Args:
        surfs: sequence of per-face point sets (each convertible to an array
            whose last axis is x, y, z).
        edges: sequence of per-edge point sets (same layout).
        corners: sequence of vertex coordinates, one [x, y, z] per vertex.

    Returns:
        A 5-tuple ``(surfs_wcs, edges_wcs, surfs_ncs, edges_ncs, corner_wcs)``:
            surfs_wcs:  object array of face point sets, untransformed.
            edges_wcs:  object array of edge point sets, untransformed.
            surfs_ncs:  object array of face point sets, normalized.
            edges_ncs:  object array of edge point sets, normalized.
            corner_wcs: array of the *normalized* corner coordinates (the name
                is historical).
        If ``corners`` is empty, a tuple of five ``None`` values is returned.
    """
    if len(corners) == 0:
        return None, None, None, None, None

    # Bounding box of the corners defines the centre and the scale.
    corners_array = np.array(corners)
    lower = corners_array.min(0)
    upper = corners_array.max(0)
    center = (upper + lower) / 2
    extent = (upper - lower).max()
    # All corners coincide (e.g. a single vertex): a reciprocal would be inf
    # and turn every output into NaN, so fall back to translation only.
    scale = 1.0 / extent if extent > 0 else 1.0

    surfs_wcs = [np.array(surf) for surf in surfs]
    surfs_ncs = [(surf_wcs - center) * scale for surf_wcs in surfs_wcs]

    edges_wcs = [np.array(edge) for edge in edges]
    edges_ncs = [(edge_wcs - center) * scale for edge_wcs in edges_wcs]

    corner_wcs = (corners_array - center) * scale

    # dtype=object so that point sets of different lengths can share a container.
    return (np.array(surfs_wcs, dtype=object),
            np.array(edges_wcs, dtype=object),
            np.array(surfs_ncs, dtype=object),
            np.array(edges_ncs, dtype=object),
            corner_wcs)

def get_adjacency_info(shape):
    """
    Build face/edge/vertex adjacency tables for a CAD shape.

    Faces, edges and vertices are enumerated with ``TopExp_Explorer`` in
    exploration order; row/column indices below refer to positions in those
    enumerations.
    NOTE(review): the explorer is understood to visit a shared sub-shape once
    per parent, so the edge and vertex enumerations may contain repeated
    entries — confirm before relying on uniqueness.

    Args:
        shape: the CAD model shape to analyse.

    Returns:
        edgeFace_adj: int32 matrix (num_edges x num_faces); 1 where the edge
            belongs to the face.
        faceEdge_adj: int32 matrix (num_faces x num_edges); transpose of the
            relation above.
        edgeCorner_adj: int32 matrix (num_edges x 2) holding the indices of the
            edge's two end vertices in the vertex enumeration.  Entries stay 0
            when an end vertex is null or not found, which cannot be told apart
            from a genuine index 0.
    """
    # Enumerate faces, edges and vertices of the shape.
    faces = []
    face_explorer = TopExp_Explorer(shape, TopAbs_FACE)
    while face_explorer.More():
        faces.append(topods.Face(face_explorer.Current()))
        face_explorer.Next()

    edges = []
    edge_explorer = TopExp_Explorer(shape, TopAbs_EDGE)
    while edge_explorer.More():
        edges.append(topods.Edge(edge_explorer.Current()))
        edge_explorer.Next()

    vertices = []
    vertex_explorer = TopExp_Explorer(shape, TopAbs_VERTEX)
    while vertex_explorer.More():
        vertices.append(topods.Vertex(vertex_explorer.Current()))
        vertex_explorer.Next()

    num_faces = len(faces)
    num_edges = len(edges)

    edgeFace_adj = np.zeros((num_edges, num_faces), dtype=np.int32)
    faceEdge_adj = np.zeros((num_faces, num_edges), dtype=np.int32)
    edgeCorner_adj = np.zeros((num_edges, 2), dtype=np.int32)

    for i, edge in enumerate(edges):
        # Mark every face whose boundary contains this edge.
        for j, face in enumerate(faces):
            face_edge_explorer = TopExp_Explorer(face, TopAbs_EDGE)
            while face_edge_explorer.More():
                if edge.IsSame(face_edge_explorer.Current()):
                    edgeFace_adj[i, j] = 1
                    faceEdge_adj[j, i] = 1
                    break
                face_edge_explorer.Next()

        # Fetch the two end vertices of the edge.
        v1 = TopoDS_Vertex()
        v2 = TopoDS_Vertex()
        topexp.Vertices(edge, v1, v2)

        if not v1.IsNull() and not v2.IsNull():
            v1_vertex = topods.Vertex(v1)
            v2_vertex = topods.Vertex(v2)

            # No early exit on purpose: if several enumerated vertices match,
            # the last matching index is the one recorded.
            for k, vertex in enumerate(vertices):
                if v1_vertex.IsSame(vertex):
                    edgeCorner_adj[i, 0] = k
                if v2_vertex.IsSame(vertex):
                    edgeCorner_adj[i, 1] = k

    return edgeFace_adj, faceEdge_adj, edgeCorner_adj

def get_bbox(shape, subshape):
    """
    Return the bounding box of a sub-shape as a flat array.

    Args:
        shape: the complete CAD model; accepted for signature compatibility
            but not used by the computation.
        subshape: the sub-shape (face or edge) whose bounds are wanted.

    Returns:
        NumPy array ``[xmin, ymin, zmin, xmax, ymax, zmax]``.
    """
    box = Bnd_Box()
    brepbndlib.Add(subshape, box)
    x_lo, y_lo, z_lo, x_hi, y_hi, z_hi = box.Get()
    bounds = [x_lo, y_lo, z_lo, x_hi, y_hi, z_hi]
    return np.array(bounds)

def parse_solid(step_path):
    """
    Parse a STEP file into sampled geometry, adjacency tables and bounding boxes.

    Faces are sampled at the nodes of their triangulation, edges at 100
    evenly spaced curve parameters, and vertices at their point.  Faces with
    no triangulation and edges with no 3D curve are skipped, so the per-face /
    per-edge point and bounding-box arrays may have fewer entries than the
    adjacency matrices, which enumerate every face and edge.

    Args:
        step_path: path of the STEP file to read.

    Returns:
        A dict with keys
            'surf_wcs', 'edge_wcs': face / edge point sets, original coordinates
            'surf_ncs', 'edge_ncs': face / edge point sets, normalized
            'corner_wcs': normalized vertex coordinates (float32)
            'corner_unique': unique rows of 'corner_wcs' (float32)
            'edgeFace_adj', 'faceEdge_adj', 'edgeCorner_adj': adjacency tables
            'surf_bbox_wcs', 'edge_bbox_wcs': per-face / per-edge bounding boxes
        or ``None`` when the file yields a null shape or a shape with no
        vertices (nothing to normalize against).

    Raises:
        Exception: if the STEP file cannot be read.
    """
    # Load STEP file
    reader = STEPControl_Reader()
    status = reader.ReadFile(step_path)
    if status != IFSelect_RetDone:
        raise Exception("Failed to read STEP file")

    reader.TransferRoots()
    shape = reader.OneShape()
    if shape.IsNull():
        # Nothing was transferred; callers treat None as "could not parse".
        return None

    # Triangulate the shape with a linear deflection of 0.01.
    # NOTE(review): the OCCT constructor is documented to run the meshing
    # itself, so the explicit Perform() looks redundant — confirm before removing.
    mesh = BRepMesh_IncrementalMesh(shape, 0.01)
    mesh.Perform()

    face_pnts = []
    edge_pnts = []
    corner_pnts = []
    surf_bbox_wcs = []
    edge_bbox_wcs = []

    # Faces: collect the triangulation nodes, moved by the face location.
    face_explorer = TopExp_Explorer(shape, TopAbs_FACE)
    while face_explorer.More():
        face = topods.Face(face_explorer.Current())
        loc = TopLoc_Location()
        triangulation = BRep_Tool.Triangulation(face, loc)

        if triangulation is not None:
            points = []
            for i in range(1, triangulation.NbNodes() + 1):  # nodes are 1-based
                pnt = triangulation.Node(i).Transformed(loc.Transformation())
                points.append([pnt.X(), pnt.Y(), pnt.Z()])

            if points:
                face_pnts.append(np.array(points, dtype=np.float32))
                surf_bbox_wcs.append(get_bbox(shape, face))

        face_explorer.Next()

    # Edges: sample the underlying curve uniformly in parameter space.
    num_samples = 100
    edge_explorer = TopExp_Explorer(shape, TopAbs_EDGE)
    while edge_explorer.More():
        edge = topods.Edge(edge_explorer.Current())
        curve_data = BRep_Tool.Curve(edge)

        # Expected result is (curve, first, last).
        # NOTE(review): some pythonocc builds are reported to return only
        # (first, last) when the edge has no 3D curve (e.g. degenerated
        # edges); treat that like a missing curve instead of failing the
        # whole file on the unpack — confirm against the installed version.
        if len(curve_data) == 3 and curve_data[0] is not None:
            curve, first, last = curve_data
            points = []
            for i in range(num_samples):
                param = first + (last - first) * float(i) / (num_samples - 1)
                pnt = curve.Value(param)
                points.append([pnt.X(), pnt.Y(), pnt.Z()])

            edge_pnts.append(np.array(points, dtype=np.float32))
            edge_bbox_wcs.append(get_bbox(shape, edge))

        edge_explorer.Next()

    # Vertices
    vertex_explorer = TopExp_Explorer(shape, TopAbs_VERTEX)
    while vertex_explorer.More():
        vertex = topods.Vertex(vertex_explorer.Current())
        pnt = BRep_Tool.Pnt(vertex)
        corner_pnts.append([pnt.X(), pnt.Y(), pnt.Z()])
        vertex_explorer.Next()

    if not corner_pnts:
        # normalize() has nothing to derive a centre/scale from; report the
        # file as unparseable rather than failing later on a None result.
        return None

    # Adjacency information
    edgeFace_adj, faceEdge_adj, edgeCorner_adj = get_adjacency_info(shape)

    # Point sets stay as lists (they can differ in length); the rest become arrays.
    corner_pnts = np.array(corner_pnts, dtype=np.float32)
    surf_bbox_wcs = np.array(surf_bbox_wcs, dtype=np.float32)
    edge_bbox_wcs = np.array(edge_bbox_wcs, dtype=np.float32)

    # Normalize the CAD model
    surfs_wcs, edges_wcs, surfs_ncs, edges_ncs, corner_wcs = normalize(face_pnts, edge_pnts, corner_pnts)

    # Create result dictionary
    data = {
        'surf_wcs': surfs_wcs,
        'edge_wcs': edges_wcs,
        'surf_ncs': surfs_ncs,
        'edge_ncs': edges_ncs,
        'corner_wcs': corner_wcs.astype(np.float32),
        'edgeFace_adj': edgeFace_adj,
        'edgeCorner_adj': edgeCorner_adj,
        'faceEdge_adj': faceEdge_adj,
        'surf_bbox_wcs': surf_bbox_wcs,
        'edge_bbox_wcs': edge_bbox_wcs,
        'corner_unique': np.unique(corner_wcs, axis=0).astype(np.float32)
    }

    return data

def load_step(step_path):
    """
    Load a STEP file and return its content as a one-element list.

    All transferred roots are combined into the single shape returned by
    ``OneShape()``; the list wrapper is kept for callers that iterate.

    Args:
        step_path: path of the STEP file to read.

    Returns:
        ``[shape]`` — a list holding the single combined shape.

    Raises:
        Exception: if the STEP file cannot be read (same behaviour as
            ``parse_solid``), instead of silently returning an empty shape.
    """
    reader = STEPControl_Reader()
    status = reader.ReadFile(step_path)
    if status != IFSelect_RetDone:
        raise Exception("Failed to read STEP file")
    reader.TransferRoots()
    return [reader.OneShape()]

def process_single_step(
    step_path:str, 
    output_path:str=None, 
    timeout:int=300
) -> dict:
    """
    Convert one STEP file and optionally pickle the result.

    Args:
        step_path: path of the STEP file to parse.
        output_path: where to pickle the parsed data; nothing is written when
            it is empty or None.
        timeout: accepted for interface compatibility; it is not used and no
            time limit is enforced here.

    Returns:
        The parsed data dict on success, or ``None`` when parsing fails or
        when ``output_path`` was given and the result could not be saved.
        Failures are logged, never raised.
    """
    try:
        data = parse_solid(step_path)
    except Exception as e:
        # Report the failure as None (not 0) so that callers testing
        # `is not None` do not mistake it for a successful result.
        logger.error(f'Failed to process {step_path}: {str(e)}')
        return None

    if data is None:
        logger.error("Failed to parse STEP file")
        return None

    if output_path:
        try:
            logger.info(f"Saving results to: {output_path}")
            # dirname is '' for a bare file name, and os.makedirs('') raises.
            output_dir = os.path.dirname(output_path)
            if output_dir:
                os.makedirs(output_dir, exist_ok=True)
            with open(output_path, 'wb') as f:
                pickle.dump(data, f)
            logger.info("Results saved successfully")
        except Exception as e:
            # A requested save that did not happen is a failure, matching
            # test(), which also returns None when saving raises.
            logger.error(f'Not saving due to error: {str(e)}')
            return None

    return data

def test(step_file_path, output_path=None):
    """
    Convert a single STEP file, log basic statistics and optionally save it.

    Args:
        step_file_path: path of the STEP file to parse.
        output_path: where to pickle the parsed data; nothing is written when
            it is empty or None.

    Returns:
        The parsed data dict, or ``None`` if parsing or saving failed (the
        error is logged, not raised).
    """
    try:
        logger.info(f"Processing STEP file: {step_file_path}")

        data = parse_solid(step_file_path)
        if data is None:
            logger.error("Failed to parse STEP file")
            return None

        # Log statistics
        logger.info("\nStatistics:")
        logger.info(f"Number of surfaces: {len(data['surf_wcs'])}")
        logger.info(f"Number of edges: {len(data['edge_wcs'])}")
        logger.info(f"Number of corners: {len(data['corner_unique'])}")

        # Save the result
        if output_path:
            logger.info(f"Saving results to: {output_path}")
            # dirname is '' for a bare file name, and os.makedirs('') raises.
            output_dir = os.path.dirname(output_path)
            if output_dir:
                os.makedirs(output_dir, exist_ok=True)
            with open(output_path, 'wb') as f:
                pickle.dump(data, f)
            logger.info("Results saved successfully")

        return data

    except Exception as e:
        logger.error(f"Error processing STEP file: {str(e)}")
        return None

def process_furniture_step(data_path):
    """
    List the STEP files of the furniture dataset, grouped by split.

    Looks for the sub-directories 'train', 'val' and 'test' under
    ``data_path`` and collects the entries whose name ends with '.step'
    (case-sensitive).

    Args:
        data_path: root directory of the dataset.

    Returns:
        Dict mapping each split to a sorted list of file *names* (not full
        paths; join them with ``data_path`` and the split name), e.g.
        {
            'train': ['a.step', 'b.step', ...],
            'val': [...],
            'test': [...]
        }
        A split whose directory is missing (or is not a directory) maps to
        an empty list.
    """
    step_dirs = {}
    for split in ['train', 'val', 'test']:
        split_path = os.path.join(data_path, split)
        if os.path.isdir(split_path):
            # Sorted so that runs are reproducible; os.listdir order is arbitrary.
            step_dirs[split] = sorted(
                name for name in os.listdir(split_path) if name.endswith('.step')
            )
        else:
            step_dirs[split] = []
    return step_dirs


def _process_step_job(input_path, output_path):
    """Worker entry point: convert one STEP file and report success as a bool.

    Returning a bool (instead of the parsed data) keeps the large arrays from
    being pickled back to the parent, and treats any non-dict result of
    process_single_step as a failure.
    """
    result = process_single_step(input_path, output_path, timeout=300)
    return isinstance(result, dict)


def main(
    input_dir='/mnt/disk2/dataset/furniture/step/furniture_dataset_step/',
    output_dir='test_data/pkl/',
    result_dir='test_data/result/',
    max_workers=None,
):
    """
    Convert every STEP file of the dataset to a pickle, split by split.

    For each of the 'train', 'val' and 'test' splits the files are processed
    in a process pool; the names of converted and failed files are written to
    ``success.txt`` and ``failed.txt`` under ``result_dir/<split>``.

    NOTE: no per-file time limit is enforced — a worker that hangs will block
    the run.

    Args:
        input_dir: dataset root containing the split sub-directories.
        output_dir: root directory for the generated ``.pkl`` files.
        result_dir: root directory for the success/failure lists.
        max_workers: number of worker processes; defaults to half of the CPU
            count, but never less than 1.
    """
    if max_workers is None:
        # cpu_count() may be None, and `// 2` is 0 on a single-core machine;
        # ProcessPoolExecutor rejects a worker count of 0.
        max_workers = max(1, (os.cpu_count() or 1) // 2)

    # Make sure the output directories exist
    os.makedirs(output_dir, exist_ok=True)
    os.makedirs(result_dir, exist_ok=True)

    # Collect all STEP file names
    step_dirs_dict = process_furniture_step(input_dir)
    total_processed = 0
    total_success = 0

    for split in ['train', 'val', 'test']:
        current_step_dirs = step_dirs_dict[split]
        if not current_step_dirs:
            logger.warning(f"No files found in {split} split")
            continue

        split_output_dir = os.path.join(output_dir, split)
        split_result_dir = os.path.join(result_dir, split)
        os.makedirs(split_output_dir, exist_ok=True)
        os.makedirs(split_result_dir, exist_ok=True)

        success_files = []  # names of converted files
        failed_files = []   # (name, reason) of files that failed

        with ProcessPoolExecutor(max_workers=max_workers) as executor:
            futures = {}
            for step_file in current_step_dirs:
                input_path = os.path.join(input_dir, split, step_file)
                # Swap only the extension; str.replace would also rewrite a
                # '.step' occurring in the middle of the name.
                pkl_name = os.path.splitext(step_file)[0] + '.pkl'
                output_path = os.path.join(split_output_dir, pkl_name)
                future = executor.submit(_process_step_job, input_path, output_path)
                futures[future] = step_file

            for future in tqdm(as_completed(futures), total=len(futures),
                             desc=f"Processing {split} set"):
                step_file = futures[future]
                try:
                    # Futures yielded by as_completed are already finished.
                    succeeded = future.result()
                except Exception as e:
                    logger.error(f"Error processing {step_file}: {str(e)}")
                    failed_files.append((step_file, str(e)))
                else:
                    if succeeded:
                        success_files.append(step_file)
                        total_success += 1
                    else:
                        # The worker already logged the cause.
                        failed_files.append((step_file, "Processing failed (see log for details)"))
                finally:
                    total_processed += 1

        # Save the list of converted files
        success_file_path = os.path.join(split_result_dir, 'success.txt')
        with open(success_file_path, 'w', encoding='utf-8') as f:
            f.write('\n'.join(success_files))
        logger.info(f"Saved {len(success_files)} successful files to {success_file_path}")

        # Save the list of failed files together with the reason
        failed_file_path = os.path.join(split_result_dir, 'failed.txt')
        with open(failed_file_path, 'w', encoding='utf-8') as f:
            for file, error in failed_files:
                f.write(f"{file}: {error}\n")
        logger.info(f"Saved {len(failed_files)} failed files to {failed_file_path}")

    # Final statistics
    if total_processed > 0:
        success_rate = (total_success / total_processed) * 100
        logger.info("Processing completed:")
        logger.info(f"Total files processed: {total_processed}")
        logger.info(f"Successfully processed: {total_success}")
        logger.info(f"Success rate: {success_rate:.2f}%")
    else:
        logger.warning("No files were processed")

# Run the batch conversion only when this file is executed as a script.
if __name__ == '__main__':
    main()