P3-SAM

张

张建站

2026/6/9 4:46:10

10分钟阅读

预览特征import os import sys import torch import torch.nn as nn import numpy as np import argparse import viser import trimesh # codingutf-8 import sys import os current_dir os.path.dirname(os.path.abspath(__file__)) os.chdir(current_dir) print(current_dir, current_dir) paths [current_dir, current_dir/../] paths.append(/data/lbg/project/hunyuan/Hunyuan3D-Part/P3-SAM) for path in paths: sys.path.insert(0, path) os.environ[PYTHONPATH] (os.environ.get(PYTHONPATH, ) : path).strip(:) from sklearn.decomposition import PCA import time sys.path.append(..) from model import build_P3SAM, load_state_dict class P3SAM(nn.Module): def __init__(self): super().__init__() build_P3SAM(self) def load_state_dict(self, ckpt_pathNone, state_dictNone, strictTrue, assignFalse, ignore_seg_mlpFalse, ignore_seg_s2_mlpFalse, ignore_iou_mlpFalse): load_state_dict(self, ckpt_pathckpt_path, state_dictstate_dict, strictstrict, assignassign, ignore_seg_mlpignore_seg_mlp, ignore_seg_s2_mlpignore_seg_s2_mlp, ignore_iou_mlpignore_iou_mlp) POINT_COLOR np.array([255, 153, 153]) POINT_SIZE 0.001 PROMPT_COLOR np.array([0, 255, 0]) MASK_COLOR np.array([0, 0, 255]) def normalize_pc(pc): pc: (N, 3) max_, min_ np.max(pc, axis0), np.min(pc, axis0) center (max_ min_) / 2 scale (max_ - min_) / 2 scale np.max(np.abs(scale)) pc (pc - center) / (scale 1e-10) return pc torch.no_grad() def get_feat(model, points, normals): data_dict { coord: points, normal: normals, color: np.ones_like(points), batch: np.zeros(points.shape[0], dtypenp.int64) } data_dict model.transform(data_dict) for k in data_dict: if isinstance(data_dict[k], torch.Tensor): data_dict[k] data_dict[k].cuda() point model.sonata(data_dict) while pooling_parent in point.keys(): assert pooling_inverse in point.keys() parent point.pop(pooling_parent) inverse point.pop(pooling_inverse) parent.feat torch.cat([parent.feat, point.feat[inverse]], dim-1) point parent feat point.feat # [M, 1232] feat model.mlp(feat) # [M, 512] feat feat[point.inverse] # [N, 512] feats feat return feats torch.no_grad() def get_mask(model, feats, points, point_prompt): point_num points.shape[0] points torch.from_numpy(points).float().cuda() # [N, 3] prompt_coord torch.from_numpy(point_prompt).float().cuda().unsqueeze(0) # [1, 3] prompt_coord prompt_coord.repeat(point_num, 1) # [N, 3] feats_seg torch.cat([feats, points, prompt_coord], dim-1) # [N, 51233] # 预测mask stage-1 pred_mask_1 model.seg_mlp_1(feats_seg).squeeze(-1) # [N] pred_mask_2 model.seg_mlp_2(feats_seg).squeeze(-1) # [N] pred_mask_3 model.seg_mlp_3(feats_seg).squeeze(-1) # [N] pred_mask torch.stack([pred_mask_1, pred_mask_2, pred_mask_3], dim-1) # [N, 3] # 预测mask stage-2 feats_seg_2 torch.cat([feats_seg, pred_mask], dim-1) # [N, 512333] feats_seg_global model.seg_s2_mlp_g(feats_seg_2) # [N, 512] feats_seg_global torch.max(feats_seg_global, dim0).values # [512] feats_seg_global feats_seg_global.unsqueeze(0).repeat(point_num, 1) # [N, 512] feats_seg_3 torch.cat([feats_seg_global, feats_seg_2], dim-1) # [N, 512333512] pred_mask_s2_1 model.seg_s2_mlp_1(feats_seg_3).squeeze(-1) # [N] pred_mask_s2_2 model.seg_s2_mlp_2(feats_seg_3).squeeze(-1) # [N] pred_mask_s2_3 model.seg_s2_mlp_3(feats_seg_3).squeeze(-1) # [N] pred_mask_s2 torch.stack([pred_mask_s2_1, pred_mask_s2_2, pred_mask_s2_3], dim-1) # [N, 3] mask_1 torch.sigmoid(pred_mask_s2_1) mask_2 torch.sigmoid(pred_mask_s2_2) mask_3 torch.sigmoid(pred_mask_s2_3) mask_1 mask_1.detach().cpu().numpy() 0.5 mask_2 mask_2.detach().cpu().numpy() 0.5 mask_3 mask_3.detach().cpu().numpy() 0.5 print(feats_seg.shape, pred_mask.shape) feats_iou torch.cat([feats_seg_global, feats_seg, pred_mask_s2], dim-1) # [N, 512333512] feats_iou model.iou_mlp(feats_iou) # [N, 512] feats_iou torch.max(feats_iou, dim0).values # [512] pred_iou model.iou_mlp_out(feats_iou) # [3] pred_iou torch.sigmoid(pred_iou) # [3] org_iou pred_iou.detach().cpu().numpy() # [3] org_iou_1 org_iou[0].item() org_iou_2 org_iou[1].item() org_iou_3 org_iou[2].item() pred_iou_1 org_iou_1 pred_iou_2 org_iou_2 pred_iou_3 org_iou_3 return mask_1, mask_2, mask_3, pred_iou_1, pred_iou_2, pred_iou_3, org_iou_1, org_iou_2, org_iou_3 def mask2color(mask): point_num mask.shape[0] colors np.expand_dims(POINT_COLOR, axis0) colors np.tile(colors, (point_num, 1)) colors[mask] MASK_COLOR return colors def main(args): # load model print(加载模型) model P3SAM() model.load_state_dict(args.ckpt_path) model.eval() model.cuda() print(模型加载完成) print(加载数据列表) data_list os.listdir(args.data_dir) print(f共加载{len(data_list)}个数据) server viser.ViserServer(hostargs.host, portargs.port) server.scene.set_up_direction(y) if args.data_dir is None: if args.data_id in data_list: data_list.remove(args.data_id) data_list.insert(0, args.data_id) cur_data_id [data_list[0]] points [None] points_handle [None] colors_pca [None] feats [None] show_colors [None] point_prompt [None] mask_res [None, None, None] iou_res [None, None, None] iou_org [None, None, None] best [None] def remove_point_prompt(): if point_prompt[0] is not None: server.scene.remove_by_name(f/sphere) point_prompt[0] None def clear_state(): mask_res[0] None mask_res[1] None mask_res[2] None iou_res[0] None iou_res[1] None iou_res[2] None iou_org[0] None iou_org[1] None iou_org[2] None best[0] None remove_point_prompt() def load_pc(use_normalTrue, noise_std0): clear_state() print(加载数据) if args.data_dir is not None: glb_data_path os.path.join(args.data_dir, cur_data_id[0]) else: glb_data_path os.path.join(args.data_root, cur_data_id[0], pure_mesh.glb) if glb_data_path.endswith(.glb) or glb_data_path.endswith(.obj): mesh trimesh.load(glb_data_path, forcemesh, processFalse) _points, face_idx trimesh.sample.sample_surface(mesh, args.point_num) _points normalize_pc(_points) _points _points np.random.normal(0, 1, size_points.shape) * noise_std normals mesh.face_normals[face_idx] if not use_normal or args.no_normal: normals normals * 0 else: raise ValueError(fUnsupported file type: {glb_data_path}) show_color np.array([POINT_COLOR]) _show_colors np.tile(show_color, (_points.shape[0], 1)) print(预处理特征) _feats get_feat(model, _points, normals) print(PCA获取特征颜色) feat_save _feats.float().detach().cpu().numpy() data_scaled feat_save / np.linalg.norm(feat_save, axis-1, keepdimsTrue) pca PCA(n_components3) data_reduced pca.fit_transform(data_scaled) data_reduced (data_reduced - data_reduced.min()) / (data_reduced.max() - data_reduced.min()) _colors_pca (data_reduced * 255).astype(np.uint8) # add point cloud _points_handle server.scene.add_point_cloud( name/point_cloud, points_points, colors_show_colors, point_sizePOINT_SIZE, ) points[0] _points points_handle[0] _points_handle colors_pca[0] _colors_pca feats[0] _feats show_colors[0] _show_colors print(加载数据完成) load_pc() server.on_client_connect def _(client: viser.ClientHandle) - None: data_list_handle client.gui.add_dropdown( Data ID, data_list ) markdown_handle client.gui.add_markdown( IOU: 1: 0.000, 2: 0.000, 3: 0.000 ) checkbox_handle client.gui.add_checkbox( Show Feature, initial_valueTrue ) _colors_pcacolors_pca[0] points_handle[0].colors _colors_pca print(f总点数: {len(_colors_pca)}) # 1. 严格唯一颜色数每个通道精确相等才算同一种颜色 unique_strict np.unique(_colors_pca.reshape(-1, 3), axis0) print(f严格唯一颜色数: {len(unique_strict)}) # 2. 量化后颜色数粗粒度更接近人眼感知 for level in [4, 8, 16, 32]: quantized (_colors_pca // level) * level unique_quant np.unique(quantized.reshape(-1, 3), axis0) print(f量化间隔{level}时颜色数: {len(unique_quant)}) # 3. 显示主要颜色占比1%的 colors_int _colors_pca.astype(np.int32) unique_colors, counts np.unique(colors_int.reshape(-1, 3), axis0, return_countsTrue) sorted_idx np.argsort(-counts) print(f\n主要颜色占比1%:) for i in range(len(sorted_idx)): idx sorted_idx[i] ratio counts[idx] / len(_colors_pca) * 100 if ratio 1.0: break color unique_colors[idx] print(f RGB({color[0]:3d},{color[1]:3d},{color[2]:3d}) - {counts[idx]:6d}点 ({ratio:.1f}%)) print(*50) def show_mask(): points_handle[0].colors colors_pca[0] checkbox_handle.on_update def _(_): show_mask() while True: time.sleep(1) if __name__ __main__: argparser argparse.ArgumentParser() argparser.add_argument(--ckpt_path, typestr, default/data/lbg/project/hunyuan/Hunyuan3D-Part/P3-SAM/weights/p3sam.safetensors, helppath to continue ckpt) argparser.add_argument(--host, default0.0.0.0, helpHost to bind to) argparser.add_argument(--port, default8000, typeint, helpPort to bind to) argparser.add_argument(--point_num, default60000, typeint, helpNumber of points to sample from the mesh) argparser.add_argument(--data_dir, default./assets, typestr, helpData directory) argparser.add_argument(--no_normal, actionstore_true, helpDo not use normal information) args argparser.parse_args() main(args)

R-GCN代码架构解析：从数据加载到模型训练的完整流程

R-GCN代码架构解析：从数据加载到模型训练的完整流程【免费下载链接】relational-gcn Keras-based implementation of Relational Graph Convolutional Networks 项目地址: https://gitcode.com/gh_mirrors/re/relational-gcn 关系图卷积网络（R-G…...

2026/6/9 4:44:07 阅读更多 →

THULAC用户词典使用教程：自定义分词结果的终极方案

THULAC用户词典使用教程：自定义分词结果的终极方案【免费下载链接】THULAC An Efficient Lexical Analyzer for Chinese 项目地址: https://gitcode.com/gh_mirrors/th/THULAC 想要让中文分词工具THULAC更懂你的专业术语吗？🤔 本文将…...

2026/6/9 4:42:14 阅读更多 →