update

update displaytable rotation
update
2024-10-18 17:13:45 +08:00 · 2024-10-14 19:37:34 +08:00 · 2024-10-13 19:47:05 +08:00 · 2024-10-13 15:24:41 +08:00 · 2024-10-12 23:11:25 +08:00 · 2024-10-12 20:25:55 +08:00
26 changed files with 1836 additions and 33658 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -1,12 +1,15 @@
 # ---> Python
 # Byte-compiled / optimized / DLL files
+test/
 __pycache__/
 *.py[cod]
 *$py.class
-
+test_output/
 # C extensions
 *.so
-
+*.txt
+experiments/
+temp_output/
 # Distribution / packaging
 .Python
 build/
--- a/app_cad.py
+++ b/app_cad.py
@@ -1,9 +1,16 @@
 from PytorchBoot.application import PytorchBootApplication
-from runners.cad_strategy import CADStrategyRunner
+from runners.cad_open_loop_strategy import CADOpenLoopStrategyRunner
+from runners.cad_close_loop_strategy import CADCloseLoopStrategyRunner

-@PytorchBootApplication("cad")
-class AppCAD:
+
+@PytorchBootApplication("cad_ol")
+class AppCADOpenLoopStrategy:
    @staticmethod
    def start():
-        CADStrategyRunner("configs/cad_config.yaml").run()
-        
+        CADOpenLoopStrategyRunner("configs/cad_open_loop_config.yaml").run()
+        
+@PytorchBootApplication("cad_cl")
+class AppCADCloseLoopStrategy:
+    @staticmethod
+    def start():
+        CADCloseLoopStrategyRunner("configs/cad_close_loop_config.yaml").run()
--- a/cam_directions.txt
+++ b/cam_directions.txt
@@ -1,160 +0,0 @@
-2.976360870451021934e-01 2.612396282015549270e-02 2.722307168556427626e-01
-2.807145935740879561e-01 2.344288301708187527e-02 2.619120507693710187e-01
-2.637931001030737743e-01 2.076180321400825785e-02 2.515933846830992748e-01
-2.468716066320595925e-01 1.808072341093463695e-02 2.412747185968275587e-01
-2.299501131610453553e-01 1.539964360786101778e-02 2.309560525105558149e-01
-2.130286196900311735e-01 1.271856380478740209e-02 2.206373864242840988e-01
-1.961071262190169640e-01 1.003748400171378119e-02 2.103187203380123549e-01
-1.791856327480027822e-01 7.356404198640163761e-03 2.000000542517406110e-01
-1.622641392769885726e-01 4.675324395566546332e-03 1.896813881654688672e-01
-1.453426458059743631e-01 1.994244592492925433e-03 1.793627220791971233e-01
-1.058318675876641773e-01 1.913315480742055485e-01 3.701966140390944293e-01
-9.931276171077207948e-02 1.796797252938450440e-01 3.553058019571109782e-01
-9.279365583387996774e-02 1.680279025134845672e-01 3.404149898751275827e-01
-8.627454995698786988e-02 1.563760797331240904e-01 3.255241777931441316e-01
-7.975544408009577202e-02 1.447242569527635858e-01 3.106333657111607360e-01
-7.323633820320367416e-02 1.330724341724031090e-01 2.957425536291773405e-01
-6.671723232631157630e-02 1.214206113920426183e-01 2.808517415471938894e-01
-6.019812644941947150e-02 1.097687886116821415e-01 2.659609294652104938e-01
-5.367902057252737363e-02 9.811696583132166471e-02 2.510701173832270983e-01
-4.715991469563526883e-02 8.646514305096116015e-02 2.361793053012436749e-01
-3.921455052209112946e-01 5.125427963019697081e-02 2.092982359830542760e-01
-3.736810423058752328e-01 4.853268829412461099e-02 2.021109868668294895e-01
-3.552165793908391711e-01 4.581109695805224424e-02 1.949237377506047031e-01
-3.367521164758031094e-01 4.308950562197988443e-02 1.877364886343799166e-01
-3.182876535607670476e-01 4.036791428590751768e-02 1.805492395181551302e-01
-2.998231906457310414e-01 3.764632294983515093e-02 1.733619904019303437e-01
-2.813587277306949241e-01 3.492473161376279112e-02 1.661747412857055572e-01
-2.628942648156589179e-01 3.220314027769043130e-02 1.589874921694807708e-01
-2.444298019006228562e-01 2.948154894161806455e-02 1.518002430532560121e-01
-2.259653389855867667e-01 2.675995760554569780e-02 1.446129939370311979e-01
-2.966121428882431688e-01 -1.243668772355264462e-01 2.528267403420925707e-01
-2.794781650275093843e-01 -1.175232445334360720e-01 2.451071876279281303e-01
-2.623441871667755443e-01 -1.106796118313456839e-01 2.373876349137637176e-01
-2.452102093060417598e-01 -1.038359791292553097e-01 2.296680821995992772e-01
-2.280762314453079753e-01 -9.699234642716492161e-02 2.219485294854348645e-01
-2.109422535845741908e-01 -9.014871372507454739e-02 2.142289767712704240e-01
-1.938082757238404064e-01 -8.330508102298417317e-02 2.065094240571059836e-01
-1.766742978631065941e-01 -7.646144832089379895e-02 1.987898713429415709e-01
-1.595403200023728096e-01 -6.961781561880342473e-02 1.910703186287771582e-01
-1.424063421416389974e-01 -6.277418291671303663e-02 1.833507659146127178e-01
-1.516386400982264460e-01 -1.586701464075628287e-01 2.415754089606511334e-01
-1.434280702011365705e-01 -1.455541040346652326e-01 2.289043405590775460e-01
-1.352175003040466672e-01 -1.324380616617676643e-01 2.162332721575039862e-01
-1.270069304069567917e-01 -1.193220192888700681e-01 2.035622037559303987e-01
-1.187963605098669162e-01 -1.062059769159724720e-01 1.908911353543568112e-01
-1.105857906127770407e-01 -9.308993454307488979e-02 1.782200669527832515e-01
-1.023752207156871513e-01 -7.997389217017729368e-02 1.655489985512096363e-01
-9.416465081859727582e-02 -6.685784979727971145e-02 1.528779301496360765e-01
-8.595408092150740031e-02 -5.374180742438212921e-02 1.402068617480624890e-01
-7.774351102441751094e-02 -4.062576505148451922e-02 1.275357933464889015e-01
-1.305310885675468879e-01 -2.574515835723965029e-01 3.302868348637944540e-01
-1.245164210467534782e-01 -2.462217366382081774e-01 3.148688482102455222e-01
-1.185017535259600685e-01 -2.349918897040197963e-01 2.994508615566965903e-01
-1.124870860051666588e-01 -2.237620427698314429e-01 2.840328749031476585e-01
-1.064724184843732491e-01 -2.125321958356430896e-01 2.686148882495986712e-01
-1.004577509635798394e-01 -2.013023489014547363e-01 2.531969015960497393e-01
-9.444308344278641576e-02 -1.900725019672663829e-01 2.377789149425008075e-01
-8.842841592199301992e-02 -1.788426550330780018e-01 2.223609282889518757e-01
-8.241374840119961021e-02 -1.676128080988896762e-01 2.069429416354029438e-01
-7.639908088040618661e-02 -1.563829611647012952e-01 1.915249549818539843e-01
-2.141758616454684239e-01 -1.401142265731682157e-01 3.208142574142802683e-01
-2.034685215614439324e-01 -1.329408282550643694e-01 3.055206239383900790e-01
-1.927611814774194687e-01 -1.257674299369604953e-01 2.902269904624999453e-01
-1.820538413933950050e-01 -1.185940316188566629e-01 2.749333569866098115e-01
-1.713465013093705136e-01 -1.114206333007528027e-01 2.596397235107196777e-01
-1.606391612253460499e-01 -1.042472349826489564e-01 2.443460900348295162e-01
-1.499318211413215862e-01 -9.707383666454511006e-02 2.290524565589393546e-01
-1.392244810572971225e-01 -8.990043834644126375e-02 2.137588230830492209e-01
-1.285171409732726311e-01 -8.272704002833740355e-02 1.984651896071590871e-01
-1.178098008892481535e-01 -7.555364171023355724e-02 1.831715561312689255e-01
-1.002417282812653465e-01 -1.857441582228861743e-01 2.313739119119407606e-01
-9.359755865267997688e-02 -1.758149544613172577e-01 2.153344006161490576e-01
-8.695338902409460724e-02 -1.658857506997483688e-01 1.992948893203573268e-01
-8.030921939550925148e-02 -1.559565469381794800e-01 1.832553780245656239e-01
-7.366504976692386797e-02 -1.460273431766105634e-01 1.672158667287739209e-01
-6.702088013833851221e-02 -1.360981394150416746e-01 1.511763554329821901e-01
-6.037671050975313564e-02 -1.261689356534727580e-01 1.351368441371904594e-01
-5.373254088116777294e-02 -1.162397318919038830e-01 1.190973328413987842e-01
-4.708837125258240330e-02 -1.063105281303349803e-01 1.030578215456070812e-01
-4.044420162399703367e-02 -9.638132436876607756e-02 8.701831024981535045e-02
-1.554821963443976385e-01 -2.148257011199891098e-01 5.250742981755206484e-01
-1.482802959028949041e-01 -2.064840275062017061e-01 5.083845075431692173e-01
-1.410783954613921698e-01 -1.981423538924143024e-01 4.916947169108177862e-01
-1.338764950198894355e-01 -1.898006802786268987e-01 4.750049262784663551e-01
-1.266745945783867011e-01 -1.814590066648394673e-01 4.583151356461149240e-01
-1.194726941368839807e-01 -1.731173330510520636e-01 4.416253450137634928e-01
-1.122707936953812463e-01 -1.647756594372646599e-01 4.249355543814120062e-01
-1.050688932538785120e-01 -1.564339858234772562e-01 4.082457637490606306e-01
-9.786699281237579151e-02 -1.480923122096898525e-01 3.915559731167091995e-01
-9.066509237087304329e-02 -1.397506385959024211e-01 3.748661824843577128e-01
-8.025776028547672303e-02 2.944407235099611442e-01 2.936572800346861634e-01
-7.539005914741314651e-02 2.795810656774440073e-01 2.811874743132241616e-01
-7.052235800934955612e-02 2.647214078449268704e-01 2.687176685917621599e-01
-6.565465687128596572e-02 2.498617500124097057e-01 2.562478628703001582e-01
-6.078695573322238921e-02 2.350020921798925411e-01 2.437780571488381842e-01
-5.591925459515880575e-02 2.201424343473754042e-01 2.313082514273761825e-01
-5.105155345709521536e-02 2.052827765148582673e-01 2.188384457059141808e-01
-4.618385231903163191e-02 1.904231186823411304e-01 2.063686399844521790e-01
-4.131615118096804845e-02 1.755634608498239935e-01 1.938988342629902051e-01
-3.644845004290446500e-02 1.607038030173068288e-01 1.814290285415282034e-01
-5.157790449341418532e-02 -2.280915238559273472e-01 2.331722629466718155e-01
-4.687897960620368565e-02 -2.143414166823043310e-01 2.194298229297667047e-01
-4.218005471899319292e-02 -2.005913095086813147e-01 2.056873829128615938e-01
-3.748112983178270019e-02 -1.868412023350582984e-01 1.919449428959564830e-01
-3.278220494457220052e-02 -1.730910951614352822e-01 1.782025028790513721e-01
-2.808328005736170779e-02 -1.593409879878122659e-01 1.644600628621462890e-01
-2.338435517015120813e-02 -1.455908808141892496e-01 1.507176228452411781e-01
-1.868543028294071540e-02 -1.318407736405662334e-01 1.369751828283360673e-01
-1.398650539573022267e-02 -1.180906664669432449e-01 1.232327428114309703e-01
-9.287580508519722999e-03 -1.043405592933202286e-01 1.094903027945258456e-01
-1.269215451024525432e-01 2.625545655654951682e-01 3.417737734235570812e-01
-1.199871749412033256e-01 2.471706458737163714e-01 3.310383402518738971e-01
-1.130528047799540942e-01 2.317867261819375746e-01 3.203029070801906575e-01
-1.061184346187048627e-01 2.164028064901587500e-01 3.095674739085074179e-01
-9.918406445745564515e-02 2.010188867983799255e-01 2.988320407368242337e-01
-9.224969429620641370e-02 1.856349671066011287e-01 2.880966075651409941e-01
-8.531532413495718226e-02 1.702510474148223041e-01 2.773611743934577545e-01
-7.838095397370795081e-02 1.548671277230435073e-01 2.666257412217745704e-01
-7.144658381245873324e-02 1.394832080312647105e-01 2.558903080500913307e-01
-6.451221365120950180e-02 1.240992883394858581e-01 2.451548748784081189e-01
-2.341853875412766850e-01 5.152039859854373044e-02 5.197893180168721150e-01
-2.252007148693486449e-01 4.944684319447055498e-02 5.020417541005327555e-01
-2.162160421974206326e-01 4.737328779039738647e-02 4.842941901841934516e-01
-2.072313695254926202e-01 4.529973238632421795e-02 4.665466262678541476e-01
-1.982466968535646079e-01 4.322617698225104943e-02 4.487990623515148436e-01
-1.892620241816365678e-01 4.115262157817788091e-02 4.310514984351755396e-01
-1.802773515097085555e-01 3.907906617410470546e-02 4.133039345188362357e-01
-1.712926788377805432e-01 3.700551077003153000e-02 3.955563706024969317e-01
-1.623080061658525031e-01 3.493195536595836148e-02 3.778088066861576833e-01
-1.533233334939244907e-01 3.285839996188519296e-02 3.600612427698183238e-01
-1.210235277878131122e-01 -3.921239465826816817e-01 2.952365626755736328e-01
-1.155743475904795203e-01 -3.762006607063697050e-01 2.844312213076097273e-01
-1.101251673931459424e-01 -3.602773748300577838e-01 2.736258799396458774e-01
-1.046759871958123506e-01 -3.443540889537458072e-01 2.628205385716819720e-01
-9.922680699847875874e-02 -3.284308030774338305e-01 2.520151972037181221e-01
-9.377762680114518079e-02 -3.125075172011218538e-01 2.412098558357542721e-01
-8.832844660381158897e-02 -2.965842313248098772e-01 2.304045144677903667e-01
-8.287926640647799714e-02 -2.806609454484979560e-01 2.195991730998265168e-01
-7.743008620914440532e-02 -2.647376595721859793e-01 2.087938317318626391e-01
-7.198090601181081349e-02 -2.488143736958740027e-01 1.979884903638987614e-01
-7.634513431648837223e-02 1.841063024461145892e-01 3.127523209464129761e-01
-7.178553403421568391e-02 1.753640395784209771e-01 2.953516633376314648e-01
-6.722593375194299559e-02 1.666217767107273651e-01 2.779510057288500091e-01
-6.266633346967032114e-02 1.578795138430337808e-01 2.605503481200685534e-01
-5.810673318739763282e-02 1.491372509753401687e-01 2.431496905112870421e-01
-5.354713290512495838e-02 1.403949881076465844e-01 2.257490329025055864e-01
-4.898753262285227006e-02 1.316527252399529724e-01 2.083483752937241029e-01
-4.442793234057959562e-02 1.229104623722593881e-01 1.909477176849426472e-01
-3.986833205830691423e-02 1.141681995045657899e-01 1.735470600761611637e-01
-3.530873177603422591e-02 1.054259366368721779e-01 1.561464024673796802e-01
-2.097103305076620516e-01 -1.384789009505066615e-01 2.811056276500599749e-01
-1.943908481741861705e-01 -1.318322337484758855e-01 2.700994804522541815e-01
-1.790713658407102893e-01 -1.251855665464451373e-01 2.590933332544483880e-01
-1.637518835072344081e-01 -1.185388993444143890e-01 2.480871860566425391e-01
-1.484324011737584992e-01 -1.118922321423836130e-01 2.370810388588367179e-01
-1.331129188402826458e-01 -1.052455649403528648e-01 2.260748916610308967e-01
-1.177934365068067368e-01 -9.859889773832210269e-02 2.150687444632250478e-01
-1.024739541733308557e-01 -9.195223053629135446e-02 2.040625972654192544e-01
-8.715447183985497448e-02 -8.530556333426059235e-02 1.930564500676134332e-01
-7.183498950637906555e-02 -7.865889613222983023e-02 1.820503028698076120e-01
--- a/cam_poses.txt
+++ b/cam_poses.txt
@@ -1,16 +0,0 @@
-3.145575805161163752e-01 2.880504262322911013e-02 2.825493829419145064e-01
-1.123509734645562752e-01 2.029833708545660254e-01 3.850874261210778249e-01
-4.106099681359473563e-01 5.397587096626933756e-02 2.164854850992790625e-01
-3.137461207489769532e-01 -1.312105099376168205e-01 2.605462930562569834e-01
-1.598492099953163215e-01 -1.717861887804604248e-01 2.542464773622247209e-01
-1.365457560883402977e-01 -2.686814305065848840e-01 3.457048215173433858e-01
-2.248832017294928876e-01 -1.472876248912720620e-01 3.361078908901704021e-01
-1.068858979098507161e-01 -1.956733619844550631e-01 2.474134232077324635e-01
-1.626840967859003728e-01 -2.231673747337765135e-01 5.417640888078720796e-01
-8.512546142354031342e-02 3.093003813424782811e-01 3.061270857561481651e-01
-5.627682938062467805e-02 -2.418416310295503635e-01 2.469147029635769264e-01
-1.338559152637017746e-01 2.779384852572739928e-01 3.525092065952403209e-01
-2.431700602132046973e-01 5.359395400261689896e-02 5.375368819332113635e-01
-1.264727079851467040e-01 -4.080472324589936584e-01 3.060419040435374827e-01
-8.090473459876104667e-02 1.928485653138081735e-01 3.301529785551944318e-01
-2.250298128411379328e-01 -1.451255681525374097e-01 2.921117748478658238e-01
--- a/combine_all_pts.py
+++ b/combine_all_pts.py
@@ -0,0 +1,15 @@
+import numpy as np
+import os
+
+if __name__ == "__main__":
+    pts_dir_path = "/home/yan20/nbv_rec/project/franka_control/temp_output/cad_model_world/pts"
+    pts_dir = os.listdir(pts_dir_path)
+    pts_list = []
+    for i in range(len(pts_dir)):
+        pts_path = os.path.join(pts_dir_path, pts_dir[i])
+        pts = np.loadtxt(pts_path)
+        pts_list.append(pts)
+    combined_pts = np.vstack(pts_list)
+    path = "/home/yan20/nbv_rec/project/franka_control"
+    np.savetxt(os.path.join(path, "combined_pts.txt"), combined_pts)
+    
--- a/configs/cad_close_loop_config.yaml
+++ b/configs/cad_close_loop_config.yaml
@@ -0,0 +1,46 @@
+
+runner:
+  general:
+    seed: 1
+    device: cpu
+    cuda_visible_devices: "0,1,2,3,4,5,6,7"
+    
+  experiment:
+    name: debug
+    root_dir: "experiments"
+  
+  generate:
+    blender_bin_path: /home/yan20/Desktop/nbv_rec/project/blender_app/blender-4.2.2-linux-x64/blender
+    generator_script_path: /home/yan20/Desktop/nbv_rec/project/blender_app/data_generator.py
+    model_dir: "/home/yan20/Desktop/nbv_rec/data/models"
+    table_model_path: "/home/yan20/Desktop/nbv_rec/data/table.obj"
+    model_start_idx: 0
+    voxel_size: 0.002
+    max_shot_view_num: 50
+    min_shot_new_pts_num: 10
+    min_coverage_increase: 0.001  
+    max_view: 64
+    min_view: 32
+    max_diag: 0.7
+    min_diag: 0.01
+    random_view_ratio: 0
+    min_cam_table_included_degree: 20
+    obj_name: "bear"
+    light_and_camera_config:
+      Camera:
+        near_plane: 0.01
+        far_plane: 5
+        fov_vertical: 25
+        resolution: [640,400]
+        eye_distance: 0.15
+        eye_angle: 25
+      Light:
+        location: [0,0,3.5]
+        orientation: [0,0,0]
+        power: 150
+
+  reconstruct:
+    soft_overlap_threshold: 0.3
+    hard_overlap_threshold: 0.6
+    scan_points_threshold: 10
+ 
--- a/configs/cad_config.yaml
+++ b/configs/cad_config.yaml
@@ -1,27 +0,0 @@
-
-runner:
-  general:
-    seed: 1
-    device: cpu
-    cuda_visible_devices: "0,1,2,3,4,5,6,7"
-    
-  experiment:
-    name: debug
-    root_dir: "experiments"
-  
-  generate:
-    model_dir: "/home/yan20/nbv_rec/data/test_CAD/test_model"
-    model_start_idx: 0
-    voxel_size: 0.005
-    max_view: 512
-    min_view: 128
-    max_diag: 0.7
-    min_diag: 0.01
-    random_view_ratio: 0
-    min_cam_table_included_degree: 20
-
-  reconstruct:
-    soft_overlap_threshold: 0.3
-    hard_overlap_threshold: 0.6
-    scan_points_threshold: 10
- 
--- a/configs/cad_open_loop_config.yaml
+++ b/configs/cad_open_loop_config.yaml
@@ -0,0 +1,43 @@
+
+runner:
+  general:
+    seed: 1
+    device: cpu
+    cuda_visible_devices: "0,1,2,3,4,5,6,7"
+    
+  experiment:
+    name: debug
+    root_dir: "experiments"
+  
+  generate:
+    blender_bin_path: /home/yan20/Desktop/nbv_rec/project/blender_app/blender-4.2.2-linux-x64/blender
+    generator_script_path: /home/yan20/Desktop/nbv_rec/project/blender_app/data_generator.py
+    model_dir: "/home/yan20/Desktop/nbv_rec/data/models"
+    table_model_path: "/home/yan20/Desktop/nbv_rec/data/table.obj"
+    model_start_idx: 0
+    voxel_size: 0.002
+    max_view: 512
+    min_view: 128
+    max_diag: 0.7
+    min_diag: 0.01
+    random_view_ratio: 0
+    min_cam_table_included_degree: 20
+    obj_name: "bear"
+    light_and_camera_config:
+      Camera:
+        near_plane: 0.01
+        far_plane: 5
+        fov_vertical: 25
+        resolution: [640,400]
+        eye_distance: 0.15
+        eye_angle: 25
+      Light:
+        location: [0,0,3.5]
+        orientation: [0,0,0]
+        power: 150
+
+  reconstruct:
+    soft_overlap_threshold: 0.3
+    hard_overlap_threshold: 0.6
+    scan_points_threshold: 10
+ 
--- a/configs/render_config.yaml
+++ b/configs/render_config.yaml
@@ -1,23 +0,0 @@
-
-runner:
-  general:
-    seed: 1
-    device: cpu
-    cuda_visible_devices: "0,1,2,3,4,5,6,7"
-    
-  experiment:
-    name: debug
-    root_dir: "experiments"
-  
-  web:
-    host: “0.0.0.0”
-    port: 11111
-  render:
-    model_dir: "/home/yan20/nbv_rec/data/test_CAD/test_model"
-    
-
-  reconstruct:
-    soft_overlap_threshold: 0.3
-    hard_overlap_threshold: 0.6
-    scan_points_threshold: 10
- 
--- a/load_normal.py
+++ b/load_normal.py
@@ -0,0 +1,49 @@
+import cv2
+import os
+import numpy as np
+
+def load_normal(path, binocular=False, left_only=False):
+    if binocular and not left_only:
+        normal_path_L = os.path.join(
+            os.path.dirname(path), "normal", os.path.basename(path) + "_L.png"
+        )
+        normal_image_L = cv2.imread(normal_path_L, cv2.IMREAD_UNCHANGED)
+        normal_path_R = os.path.join(
+            os.path.dirname(path), "normal", os.path.basename(path) + "_R.png"
+        )
+        normal_image_R = cv2.imread(normal_path_R, cv2.IMREAD_UNCHANGED)
+        normalized_normal_image_L = normal_image_L / 255.0 * 2.0 - 1.0
+        normalized_normal_image_R = normal_image_R / 255.0 * 2.0 - 1.0
+        return normalized_normal_image_L, normalized_normal_image_R
+    else:
+        if binocular and left_only:
+            normal_path = os.path.join(
+                os.path.dirname(path), "normal", os.path.basename(path) + "_L.png"
+            )
+        else:
+            normal_path = os.path.join(
+                os.path.dirname(path), "normal", os.path.basename(path) + ".png"
+            )
+        normal_image = cv2.imread(normal_path, cv2.IMREAD_UNCHANGED)
+        normalized_normal_image = normal_image / 255.0 * 2.0 - 1.0
+        return normalized_normal_image
+
+def show_rgb(event, x, y, flags, param):
+    if event == cv2.EVENT_MOUSEMOVE:
+        pixel_value = param[y, x]
+        print(f"RGB at ({x},{y}): {pixel_value}")
+
+if __name__ == "__main__":
+    path = "/Users/hofee/temp/1"
+    normal_image = load_normal(path, binocular=True, left_only=True)
+    display_image = ((normal_image + 1.0) / 2.0 * 255).astype(np.uint8)
+
+    cv2.namedWindow("Normal Image")
+    cv2.setMouseCallback("Normal Image", show_rgb, param=display_image)
+
+    while True:
+        cv2.imshow("Normal Image", display_image)
+        if cv2.waitKey(1) & 0xFF == ord('q'):
+            break
+
+    cv2.destroyAllWindows()
--- a/mesh_point_cloud.txt
+++ b/mesh_point_cloud.txt
--- a/runners/cad_close_loop_strategy.py
+++ b/runners/cad_close_loop_strategy.py
@@ -0,0 +1,244 @@
+import os
+import time
+import trimesh
+import tempfile
+import subprocess
+import numpy as np
+from PytorchBoot.runners.runner import Runner
+from PytorchBoot.config import ConfigManager
+import PytorchBoot.stereotype as stereotype
+from PytorchBoot.utils.log_util import Log
+from PytorchBoot.status import status_manager
+
+from utils.control_util import ControlUtil
+from utils.communicate_util import CommunicateUtil
+from utils.pts_util import PtsUtil
+from utils.reconstruction_util import ReconstructionUtil
+from utils.preprocess_util import save_scene_data, save_scene_data_multithread
+from utils.data_load import DataLoadUtil
+from utils.view_util import ViewUtil
+
+
+@stereotype.runner("CAD_close_loop_strategy_runner")
+class CADCloseLoopStrategyRunner(Runner):
+
+    def __init__(self, config_path: str):
+        super().__init__(config_path)
+        self.load_experiment("cad_strategy")
+        self.status_info = {
+            "status_manager": status_manager,
+            "app_name": "cad",
+            "runner_name": "CAD_close_loop_strategy_runner",
+        }
+        self.generate_config = ConfigManager.get("runner", "generate")
+        self.reconstruct_config = ConfigManager.get("runner", "reconstruct")
+        self.blender_bin_path = self.generate_config["blender_bin_path"]
+        self.generator_script_path = self.generate_config["generator_script_path"]
+        self.model_dir = self.generate_config["model_dir"]
+        self.voxel_size = self.generate_config["voxel_size"]
+        self.max_view = self.generate_config["max_view"]
+        self.min_view = self.generate_config["min_view"]
+        self.max_diag = self.generate_config["max_diag"]
+        self.min_diag = self.generate_config["min_diag"]
+        self.min_cam_table_included_degree = self.generate_config[
+            "min_cam_table_included_degree"
+        ]
+        self.max_shot_view_num = self.generate_config["max_shot_view_num"]
+        self.min_shot_new_pts_num = self.generate_config["min_shot_new_pts_num"]
+        self.min_coverage_increase = self.generate_config["min_coverage_increase"]
+        
+        self.random_view_ratio = self.generate_config["random_view_ratio"]
+
+        self.soft_overlap_threshold = self.reconstruct_config["soft_overlap_threshold"]
+        self.hard_overlap_threshold = self.reconstruct_config["hard_overlap_threshold"]
+        self.scan_points_threshold = self.reconstruct_config["scan_points_threshold"]
+
+    def create_experiment(self, backup_name=None):
+        super().create_experiment(backup_name)
+
+    def load_experiment(self, backup_name=None):
+        super().load_experiment(backup_name)
+
+    def split_scan_pts_and_obj_pts(self, world_pts, z_threshold=0):
+        scan_pts = world_pts[world_pts[:, 2] < z_threshold]
+        obj_pts = world_pts[world_pts[:, 2] >= z_threshold]
+        return scan_pts, obj_pts
+
+    def run_one_model(self, model_name):
+        temp_dir = "/home/yan20/nbv_rec/project/franka_control/temp_output"
+        ControlUtil.connect_robot()
+        """ init robot """
+        Log.info("[Part 1/5] start init and register")
+        ControlUtil.init()
+
+        """ load CAD model """
+        model_path = os.path.join(self.model_dir, model_name, "mesh.ply")
+        temp_name = "cad_model_world"
+        cad_model = trimesh.load(model_path)
+        """ take first view """
+        Log.info("[Part 1/5] take first view data")
+        view_data = CommunicateUtil.get_view_data(init=True)
+        first_cam_pts = ViewUtil.get_pts(view_data)
+        first_cam_to_real_world = ControlUtil.get_pose()
+        first_real_world_pts = PtsUtil.transform_point_cloud(
+            first_cam_pts, first_cam_to_real_world
+        )
+        _, first_splitted_real_world_pts = self.split_scan_pts_and_obj_pts(
+            first_real_world_pts
+        )
+        np.savetxt(f"first_real_pts_{model_name}.txt", first_splitted_real_world_pts)
+        """ register """
+        Log.info("[Part 1/4] do registeration")
+        real_world_to_cad = PtsUtil.register(first_splitted_real_world_pts, cad_model)
+        cad_to_real_world = np.linalg.inv(real_world_to_cad)
+        Log.success("[Part 1/4] finish init and register")
+        real_world_to_blender_world = np.eye(4)
+        real_world_to_blender_world[:3, 3] = np.asarray([0, 0, 0.9215])
+        cad_model_real_world: trimesh.Trimesh = cad_model.apply_transform(
+            cad_to_real_world
+        )
+        cad_model_real_world.export(
+            os.path.join(temp_dir, f"real_world_{temp_name}.obj")
+        )
+        cad_model_blender_world: trimesh.Trimesh = cad_model.apply_transform(
+            real_world_to_blender_world
+        )
+
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_dir = "/home/yan20/nbv_rec/project/franka_control/temp_output"
+            cad_model_blender_world.export(os.path.join(temp_dir, f"{temp_name}.obj"))
+            """ sample view """
+            Log.info("[Part 2/4] start running renderer")
+            subprocess.run(
+                [
+                    self.blender_bin_path,
+                    "-b",
+                    "-P",
+                    self.generator_script_path,
+                    "--",
+                    temp_dir,
+                ],
+                capture_output=True,
+                text=True,
+            )
+            Log.success("[Part 2/4] finish running renderer")
+            
+            """ preprocess """
+            Log.info("[Part 3/4] start preprocessing data")
+            save_scene_data(temp_dir, temp_name)
+            Log.success("[Part 3/4] finish preprocessing data")
+
+            pts_dir = os.path.join(temp_dir, temp_name, "pts")
+            sample_view_pts_list = []
+            scan_points_idx_list = []
+            frame_num = len(os.listdir(pts_dir))
+            for frame_idx in range(frame_num):
+                pts_path = os.path.join(temp_dir, temp_name, "pts", f"{frame_idx}.txt")
+                idx_path = os.path.join(
+                    temp_dir, temp_name, "scan_points_indices", f"{frame_idx}.npy"
+                )
+                point_cloud = np.loadtxt(pts_path)
+                if point_cloud.shape[0] != 0:
+                    sampled_point_cloud = PtsUtil.voxel_downsample_point_cloud(
+                        point_cloud, self.voxel_size
+                    )
+                indices = np.load(idx_path)
+                try:
+                    len(indices)
+                except:
+                    indices = np.array([indices])
+                sample_view_pts_list.append(sampled_point_cloud)
+                scan_points_idx_list.append(indices)
+
+            """ close-loop strategy """
+            scanned_pts = PtsUtil.voxel_downsample_point_cloud(
+                first_splitted_real_world_pts, self.voxel_size
+            )
+            shot_pts_list = [first_splitted_real_world_pts]
+            history_indices = []
+            last_coverage = 0
+            Log.info("[Part 4/4] start close-loop control")
+            cnt = 0
+            while True:
+                #import ipdb; ipdb.set_trace()
+                next_best_view, next_best_coverage, next_best_covered_num = (
+                    ReconstructionUtil.compute_next_best_view_with_overlap(
+                        scanned_pts,
+                        sample_view_pts_list,
+                        history_indices,
+                        scan_points_idx_list,
+                        threshold=self.voxel_size,
+                        overlap_area_threshold=25,
+                        scan_points_threshold=self.scan_points_threshold,
+                    )
+                )
+                nbv_path = DataLoadUtil.get_path(temp_dir, temp_name, next_best_view)
+                nbv_cam_info = DataLoadUtil.load_cam_info(nbv_path, binocular=True)
+                nbv_cam_to_world = nbv_cam_info["cam_to_world_O"]
+                ControlUtil.move_to(nbv_cam_to_world)
+                ''' get world pts '''
+                time.sleep(0.5)
+                view_data = CommunicateUtil.get_view_data()
+                if view_data is None:
+                    Log.error("No view data received")
+                    continue
+                cam_shot_pts = ViewUtil.get_pts(view_data)
+                world_shot_pts = PtsUtil.transform_point_cloud(
+                    cam_shot_pts, first_cam_to_real_world
+                )
+                _, world_splitted_shot_pts = self.split_scan_pts_and_obj_pts(
+                    world_shot_pts
+                )
+                shot_pts_list.append(world_splitted_shot_pts)
+                
+                debug_dir = os.path.join(temp_dir, "debug")
+                if not os.path.exists(debug_dir):
+                    os.makedirs(debug_dir)
+                np.savetxt(os.path.join(debug_dir,  f"shot_pts_{cnt}.txt"), world_splitted_shot_pts)
+                np.savetxt(os.path.join(debug_dir,  f"render_pts_{cnt}.txt"), sample_view_pts_list[next_best_view])
+                #real_world_to_cad = PtsUtil.register(first_splitted_real_world_pts, cad_model)
+                #import ipdb; ipdb.set_trace()
+                last_scanned_pts_num = scanned_pts.shape[0]
+                new_scanned_pts = PtsUtil.voxel_downsample_point_cloud(
+                    np.vstack([scanned_pts, world_splitted_shot_pts]), self.voxel_size
+                )
+                new_scanned_pts_num = new_scanned_pts.shape[0]
+                history_indices.append(scan_points_idx_list[next_best_view])
+                scanned_pts = new_scanned_pts
+                Log.info(
+                    f"Next Best cover pts: {next_best_covered_num}, Best coverage: {next_best_coverage}"
+                )
+                
+                coverage_rate_increase = next_best_coverage - last_coverage
+                if coverage_rate_increase < self.min_coverage_increase:
+                    Log.info(f"Coverage rate = {coverage_rate_increase} < {self.min_coverage_increase}, stop scanning")
+                    # break
+                last_coverage = next_best_coverage
+                
+                new_added_pts_num = new_scanned_pts_num - last_scanned_pts_num
+                if new_added_pts_num < self.min_shot_new_pts_num:
+                    Log.info(f"New added pts num = {new_added_pts_num} < {self.min_shot_new_pts_num}")
+                    #ipdb.set_trace()
+                if len(shot_pts_list) >= self.max_shot_view_num:
+                    Log.info(f"Scanned view num = {len(shot_pts_list)} >= {self.max_shot_view_num}, stop scanning")
+                    #break
+                cnt += 1
+                
+            Log.success("[Part 4/4] finish close-loop control")
+
+
+    def run(self):
+        total = len(os.listdir(self.model_dir))
+        model_start_idx = self.generate_config["model_start_idx"]
+        count_object = model_start_idx
+        for model_name in os.listdir(self.model_dir[model_start_idx:]):
+            Log.info(f"[{count_object}/{total}]Processing {model_name}")
+            self.run_one_model(model_name)
+            Log.success(f"[{count_object}/{total}]Finished processing {model_name}")
+
+
+# ---------------------------- test ---------------------------- #
+if __name__ == "__main__":
+
+    model_path = r"C:\Users\hofee\Downloads\mesh.obj"
+    model = trimesh.load(model_path)
--- a/runners/cad_open_loop_strategy.py
+++ b/runners/cad_open_loop_strategy.py
@@ -0,0 +1,224 @@
+import os
+import time
+import trimesh
+import tempfile
+import subprocess
+import numpy as np
+from PytorchBoot.runners.runner import Runner
+from PytorchBoot.config import ConfigManager
+import PytorchBoot.stereotype as stereotype
+from PytorchBoot.utils.log_util import Log
+from PytorchBoot.status import status_manager
+
+from utils.control_util import ControlUtil
+from utils.communicate_util import CommunicateUtil
+from utils.pts_util import PtsUtil
+from utils.reconstruction_util import ReconstructionUtil
+from utils.preprocess_util import save_scene_data, save_scene_data_multithread
+from utils.data_load import DataLoadUtil
+from utils.view_util import ViewUtil
+
+
+@stereotype.runner("CAD_open_loop_strategy_runner")
+class CADOpenLoopStrategyRunner(Runner):
+
+    def __init__(self, config_path: str):
+        super().__init__(config_path)
+        self.load_experiment("cad_open_loop_strategy")
+        self.status_info = {
+            "status_manager": status_manager,
+            "app_name": "cad",
+            "runner_name": "CAD_open_loop_strategy_runner"
+        }
+        self.generate_config = ConfigManager.get("runner", "generate")
+        self.reconstruct_config = ConfigManager.get("runner", "reconstruct")
+        self.blender_bin_path = self.generate_config["blender_bin_path"]
+        self.generator_script_path = self.generate_config["generator_script_path"]
+        self.model_dir = self.generate_config["model_dir"]
+        self.voxel_size = self.generate_config["voxel_size"]
+        self.max_view = self.generate_config["max_view"]
+        self.min_view = self.generate_config["min_view"]
+        self.max_diag = self.generate_config["max_diag"]
+        self.min_diag = self.generate_config["min_diag"]
+        self.min_cam_table_included_degree = self.generate_config["min_cam_table_included_degree"]
+        self.random_view_ratio = self.generate_config["random_view_ratio"]
+        
+        self.soft_overlap_threshold = self.reconstruct_config["soft_overlap_threshold"]
+        self.hard_overlap_threshold = self.reconstruct_config["hard_overlap_threshold"]
+        self.scan_points_threshold = self.reconstruct_config["scan_points_threshold"]
+        
+    def create_experiment(self, backup_name=None):
+        super().create_experiment(backup_name)
+    
+    def load_experiment(self, backup_name=None):
+        super().load_experiment(backup_name)
+    
+    def split_scan_pts_and_obj_pts(self, world_pts, z_threshold = 0):
+        scan_pts = world_pts[world_pts[:,2] < z_threshold]
+        obj_pts = world_pts[world_pts[:,2] >= z_threshold]
+        return scan_pts, obj_pts
+
+    def run_one_model(self, model_name):
+        temp_dir = "/home/yan20/nbv_rec/project/franka_control/temp_output"
+        result = dict()
+        
+        shot_pts_list = []
+        ControlUtil.connect_robot()
+        ''' init robot '''
+        Log.info("[Part 1/5] start init and register")
+        ControlUtil.init()
+        
+        ''' load CAD model '''
+        model_path = os.path.join(self.model_dir, model_name,"mesh.ply")
+        temp_name = "cad_model_world"
+        cad_model = trimesh.load(model_path)
+        ''' take first view '''
+        Log.info("[Part 1/5] take first view data")
+        view_data = CommunicateUtil.get_view_data(init=True)
+        first_cam_pts = ViewUtil.get_pts(view_data)
+        first_cam_to_real_world = ControlUtil.get_pose()
+        first_real_world_pts = PtsUtil.transform_point_cloud(first_cam_pts, first_cam_to_real_world)
+        _, first_splitted_real_world_pts = self.split_scan_pts_and_obj_pts(first_real_world_pts)
+        np.savetxt(f"first_real_pts_{model_name}.txt", first_splitted_real_world_pts)
+        ''' register '''
+        Log.info("[Part 1/5] do registeration")
+        real_world_to_cad = PtsUtil.register(first_splitted_real_world_pts, cad_model) 
+        cad_to_real_world = np.linalg.inv(real_world_to_cad)
+        Log.success("[Part 1/5] finish init and register")
+        real_world_to_blender_world = np.eye(4)
+        real_world_to_blender_world[:3, 3] = np.asarray([0, 0, 0.9215])
+        cad_model_real_world:trimesh.Trimesh = cad_model.apply_transform(cad_to_real_world)
+        cad_model_real_world.export(os.path.join(temp_dir, f"real_world_{temp_name}.obj"))
+        cad_model_blender_world:trimesh.Trimesh = cad_model.apply_transform(real_world_to_blender_world)
+        
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_dir = "/home/yan20/nbv_rec/project/franka_control/temp_output"
+            cad_model_blender_world.export(os.path.join(temp_dir, f"{temp_name}.obj"))
+            scene_dir = os.path.join(temp_dir, temp_name)
+            ''' sample view '''
+            Log.info("[Part 2/5] start running renderer")
+            subprocess.run([
+                self.blender_bin_path, '-b', '-P', self.generator_script_path, '--', temp_dir
+            ], capture_output=True, text=True)
+            Log.success("[Part 2/5] finish running renderer")
+            
+        
+            world_model_points = np.loadtxt(os.path.join(scene_dir, "points_and_normals.txt"))[:,:3]
+            ''' preprocess '''
+            Log.info("[Part 3/5] start preprocessing data")
+            save_scene_data(temp_dir, temp_name)
+            Log.success("[Part 3/5] finish preprocessing data")
+            
+            pts_dir = os.path.join(temp_dir,temp_name,"pts")
+            sample_view_pts_list = []
+            scan_points_idx_list = []
+            frame_num = len(os.listdir(pts_dir))
+            
+            for frame_idx in range(frame_num):
+                pts_path = os.path.join(temp_dir,temp_name, "pts", f"{frame_idx}.txt")
+                idx_path = os.path.join(temp_dir,temp_name, "scan_points_indices", f"{frame_idx}.npy")
+                point_cloud = np.loadtxt(pts_path)
+                if point_cloud.shape[0] != 0:
+                    sampled_point_cloud = PtsUtil.voxel_downsample_point_cloud(point_cloud, self.voxel_size)
+                indices = np.load(idx_path) 
+                try:
+                    len(indices)
+                except:
+                    indices = np.array([indices])
+                sample_view_pts_list.append(sampled_point_cloud)
+                scan_points_idx_list.append(indices)
+
+            ''' generate strategy '''
+            
+            Log.info("[Part 4/5] start generating strategy")
+            limited_useful_view, _, _ = ReconstructionUtil.compute_next_best_view_sequence_with_overlap(
+                world_model_points, sample_view_pts_list, 
+                scan_points_indices_list = scan_points_idx_list,
+                init_view=0,
+                threshold=self.voxel_size, 
+                soft_overlap_threshold = self.soft_overlap_threshold,
+                hard_overlap_threshold = self.hard_overlap_threshold,
+                scan_points_threshold = self.scan_points_threshold, 
+                status_info=self.status_info
+            )
+            Log.success("[Part 4/5] finish generating strategy")
+        
+            ''' extract cam_to_world sequence  '''
+            cam_to_world_seq = []
+            coveraget_rate_seq = []
+            render_pts = []
+            idx_seq = []
+            for idx, coverage_rate in limited_useful_view:
+                path = DataLoadUtil.get_path(temp_dir, temp_name, idx)
+                cam_info = DataLoadUtil.load_cam_info(path, binocular=True)
+                cam_to_world_seq.append(cam_info["cam_to_world_O"])
+                coveraget_rate_seq.append(coverage_rate)
+                idx_seq.append(idx)
+                render_pts.append(sample_view_pts_list[idx])
+            
+        Log.info("[Part 5/5] start running robot")
+        ''' take best seq view '''
+        #import ipdb; ipdb.set_trace()
+        target_scanned_pts = np.concatenate(sample_view_pts_list)
+        voxel_downsampled_target_scanned_pts = PtsUtil.voxel_downsample_point_cloud(target_scanned_pts, self.voxel_size)
+        result = dict()
+        gt_scanned_pts = np.concatenate(render_pts, axis=0)
+        voxel_down_sampled_gt_scanned_pts = PtsUtil.voxel_downsample_point_cloud(gt_scanned_pts, self.voxel_size)
+        result["gt_final_coverage_rate_cad"] = ReconstructionUtil.compute_coverage_rate(voxel_downsampled_target_scanned_pts, voxel_down_sampled_gt_scanned_pts, self.voxel_size)
+        step = 1
+        result["real_coverage_rate_seq"] = []
+        for cam_to_world in cam_to_world_seq:
+            try:
+                ControlUtil.move_to(cam_to_world)
+                ''' get world pts '''
+                time.sleep(0.5)
+                view_data = CommunicateUtil.get_view_data()
+                if view_data is None:
+                    Log.error("Failed to get view data")
+                    continue
+                cam_pts = ViewUtil.get_pts(view_data)
+                shot_pts_list.append(cam_pts)
+                scanned_pts = np.concatenate(shot_pts_list, axis=0)
+                voxel_down_sampled_scanned_pts = PtsUtil.voxel_downsample_point_cloud(scanned_pts, self.voxel_size)
+                voxel_down_sampled_scanned_pts_world = PtsUtil.transform_point_cloud(voxel_down_sampled_scanned_pts, first_cam_to_real_world)
+                curr_CR = ReconstructionUtil.compute_coverage_rate(voxel_downsampled_target_scanned_pts, voxel_down_sampled_scanned_pts_world, self.voxel_size)
+                Log.success(f"(step {step}/{len(cam_to_world_seq)}) current coverage: {curr_CR} | gt coverage: {result['gt_final_coverage_rate_cad']}")
+                result["real_final_coverage_rate"] = curr_CR
+                result["real_coverage_rate_seq"].append(curr_CR)
+                step += 1
+            except Exception as e:
+                Log.error(f"Failed to move to {cam_to_world}")
+                Log.error(e)
+            
+            #import ipdb;ipdb.set_trace()
+
+        for idx in range(len(shot_pts_list)):
+            if not os.path.exists(os.path.join(temp_dir, temp_name, "shot_pts")):
+                os.makedirs(os.path.join(temp_dir, temp_name, "shot_pts"))
+            if not os.path.exists(os.path.join(temp_dir, temp_name, "render_pts")):
+                os.makedirs(os.path.join(temp_dir, temp_name, "render_pts"))
+            shot_pts = PtsUtil.transform_point_cloud(shot_pts_list[idx], first_cam_to_real_world)
+            np.savetxt(os.path.join(temp_dir, temp_name, "shot_pts", f"{idx}.txt"), shot_pts)
+            np.savetxt(os.path.join(temp_dir, temp_name, "render_pts", f"{idx}.txt"), render_pts[idx])
+        
+            
+        Log.success("[Part 5/5] finish running robot")
+        
+        Log.debug(result)
+    
+    def run(self):
+        total = len(os.listdir(self.model_dir))
+        model_start_idx = self.generate_config["model_start_idx"]
+        count_object = model_start_idx
+        for model_name in os.listdir(self.model_dir[model_start_idx:]):
+            Log.info(f"[{count_object}/{total}]Processing {model_name}")
+            self.run_one_model(model_name)
+            Log.success(f"[{count_object}/{total}]Finished processing {model_name}")
+        
+            
+# ---------------------------- test ---------------------------- #
+if __name__ == "__main__":
+    
+    model_path = r"C:\Users\hofee\Downloads\mesh.obj"
+    model = trimesh.load(model_path)
+    
--- a/runners/cad_strategy.py
+++ b/runners/cad_strategy.py
@@ -1,192 +0,0 @@
-import os
-import trimesh
-import numpy as np
-from PytorchBoot.runners.runner import Runner
-from PytorchBoot.config import ConfigManager
-import PytorchBoot.stereotype as stereotype
-from PytorchBoot.utils.log_util import Log
-from PytorchBoot.status import status_manager
-
-
-import sys
-
-sys.path.append(r"C:\Document\Local Project\nbv_rec_control")
-#from utils.control_util import ControlUtil
-from utils.communicate_util import CommunicateUtil
-from utils.pts_util import PtsUtil
-from utils.view_sample_util import ViewSampleUtil
-from utils.reconstruction_util import ReconstructionUtil
-
-
-@stereotype.runner("CAD_strategy_runner")
-class CADStrategyRunner(Runner):
-
-    def __init__(self, config_path: str):
-        super().__init__(config_path)
-        self.load_experiment("cad_strategy")
-        self.status_info = {
-            "status_manager": status_manager,
-            "app_name": "cad",
-            "runner_name": "cad_strategy"
-        }
-        self.generate_config = ConfigManager.get("runner", "generate")
-        self.reconstruct_config = ConfigManager.get("runner", "reconstruct")
-        self.model_dir = self.generate_config["model_dir"]
-        self.voxel_size = self.generate_config["voxel_size"]
-        self.max_view = self.generate_config["max_view"]
-        self.min_view = self.generate_config["min_view"]
-        self.max_diag = self.generate_config["max_diag"]
-        self.min_diag = self.generate_config["min_diag"]
-        self.min_cam_table_included_degree = self.generate_config["min_cam_table_included_degree"]
-        self.random_view_ratio = self.generate_config["random_view_ratio"]
-        
-        self.soft_overlap_threshold = self.reconstruct_config["soft_overlap_threshold"]
-        self.hard_overlap_threshold = self.reconstruct_config["hard_overlap_threshold"]
-        self.scan_points_threshold = self.reconstruct_config["scan_points_threshold"]
-        
-    def create_experiment(self, backup_name=None):
-        super().create_experiment(backup_name)
-    
-    def load_experiment(self, backup_name=None):
-        super().load_experiment(backup_name)
-        
-    def run_one_model(self, model_name):
-        
-        ''' init robot '''
-        ControlUtil.init()
-        ''' load CAD model '''
-        model_path = os.path.join(self.model_dir, model_name)
-        cad_model = trimesh.load(model_path)
-        ''' take first view '''
-        view_data = CommunicateUtil.get_view_data()
-        first_cam_pts = None
-        ''' register '''
-        cad_to_cam = PtsUtil.register(first_cam_pts, cad_model)
-        cam_to_world = ControlUtil.get_pose()
-        cad_to_world = cam_to_world @ cad_to_cam
-        cad_model:trimesh.Trimesh = cad_model.apply_transform(cad_to_world)
-        ''' sample view '''
-        min_corner = cad_model.bounds[0]
-        max_corner = cad_model.bounds[1] 
-        diag = np.linalg.norm(max_corner - min_corner)
-        view_num = int(self.min_view + (diag - self.min_diag)/(self.max_diag - self.min_diag) * (self.max_view - self.min_view))
-        sampled_view_data = ViewSampleUtil.sample_view_data_world_space(
-            cad_model, cad_to_world,  
-            voxel_size = self.voxel_size,
-            max_views = view_num,
-            min_cam_table_included_degree= self.min_cam_table_included_degree,
-            random_view_ratio = self.random_view_ratio
-        )
-        cam_to_world_poses = sampled_view_data["cam_to_world_poses"]
-        world_model_points = sampled_view_data["voxel_down_sampled_points"]
-
-        ''' take sample view '''
-        scan_points_idx_list = []
-        sample_view_pts_list = []
-        for cam_to_world in cam_to_world_poses:
-            ControlUtil.move_to(cam_to_world)
-            ''' get world pts '''
-            view_data = CommunicateUtil.get_view_data()
-            cam_pts = None
-            scan_points_idx = None
-            world_pts = PtsUtil.transform_point_cloud(cam_pts, cam_to_world)
-            sample_view_pts_list.append(world_pts)
-            scan_points_idx_list.append(scan_points_idx)
-            
-        ''' generate strategy '''
-        scan_points = ReconstructionUtil.generate_scan_points(display_table_top=0, display_table_radius=0.25)
-        
-        limited_useful_view, _, _ = ReconstructionUtil.compute_next_best_view_sequence_with_overlap(
-            world_model_points, sample_view_pts_list, 
-            scan_points_indices_list = scan_points_idx_list,
-            init_view=0,
-            threshold=self.voxel_size, 
-            soft_overlap_threshold = self.soft_overlap_threshold,
-            hard_overlap_threshold = self.hard_overlap_threshold,
-            scan_points_threshold = self.scan_points_threshold, 
-            status_info=self.status_info
-        )
-        
-        ''' extract cam_to_world sequence  '''
-        cam_to_world_seq = []
-        coveraget_rate_seq = []
-        
-        for idx, coverage_rate in limited_useful_view:
-            cam_to_world_seq.append(cam_to_world_poses[idx])
-            coveraget_rate_seq.append(coverage_rate)
-            
-        ''' take best seq view '''
-        for cam_to_world in cam_to_world_seq:
-            ControlUtil.move_to(cam_to_world)
-            ''' get world pts '''
-            view_data = CommunicateUtil.get_view_data()
-            cam_pts = None
-            scan_points_idx = None
-            world_pts = PtsUtil.transform_point_cloud(cam_pts, cam_to_world)
-            sample_view_pts_list.append(world_pts)
-            scan_points_idx_list.append(scan_points_idx)
-        
-    
-    def run(self):
-        total = len(os.listdir(self.model_dir))
-        model_start_idx = self.generate_config["model_start_idx"]
-        count_object = model_start_idx
-        for model_name in os.listdir(self.model_dir[model_start_idx:]):
-            Log.info(f"[{count_object}/{total}]Processing {model_name}")
-            self.run_one_model(model_name)
-            Log.success(f"[{count_object}/{total}]Finished processing {model_name}")
-        
-            
-# ---------------------------- test ---------------------------- #
-if __name__ == "__main__":
-    
-    model_path = r"C:\Users\hofee\Downloads\mesh.obj"
-    model = trimesh.load(model_path)
-    
-    ''' test register '''
-    # test_pts_L = np.load(r"C:\Users\hofee\Downloads\0.npy")
-    
-    # import open3d as o3d
-    # def add_noise(points, translation, rotation):
-    #     R = o3d.geometry.get_rotation_matrix_from_axis_angle(rotation)
-    #     noisy_points = points @ R.T + translation
-    #     return noisy_points
-    
-    # translation_noise = np.random.uniform(-0.5, 0.5, size=3)
-    # rotation_noise = np.random.uniform(-np.pi/4, np.pi/4, size=3) 
-    # noisy_pts_L = add_noise(test_pts_L, translation_noise, rotation_noise)
-    
-    # cad_to_cam_L = PtsUtil.register(noisy_pts_L, model)
-    
-    # cad_pts_L = PtsUtil.transform_point_cloud(noisy_pts_L, cad_to_cam_L)
-    # np.savetxt(r"test.txt", cad_pts_L)
-    # np.savetxt(r"src.txt", noisy_pts_L)
-    
-    ''' test view sample '''
-    
-    sampled_view_data = ViewSampleUtil.sample_view_data_world_space(
-            model, np.eye(4),  
-            voxel_size = 0.005,
-            max_views = 20,
-            min_cam_table_included_degree= 20,
-            random_view_ratio = 0
-        )
-    cam_poses = sampled_view_data["cam_to_world_poses"]
-    cam_poses = np.array(cam_poses)
-    print(cam_poses.shape)
-    def sample_camera_direction(cam_pose, num_samples, sample_distance):
-        cam_position = cam_pose[:3, 3]
-        cam_direction = cam_pose[:3, 2]
-        sampled_points = np.array([cam_position - (i + 1) * sample_distance * cam_direction for i in range(num_samples)])
-        return sampled_points
-    
-    all_sampled_points = []
-    for i in range(cam_poses.shape[0]):
-        samped_points = sample_camera_direction(cam_poses[i], 10, 0.02)
-        all_sampled_points.append(samped_points)
-        
-    all_sampled_points = np.concatenate(all_sampled_points, axis=0)
-    np.savetxt(r"cam_poses.txt", cam_poses[:, :3, 3])
-    np.savetxt(r"cam_directions.txt", all_sampled_points)
-    
-    
--- a/runners/inference.py
+++ b/runners/inference.py
@@ -1,87 +0,0 @@
-import os
-import trimesh
-import numpy as np
-from PytorchBoot.runners.runner import Runner
-from PytorchBoot.config import ConfigManager
-import PytorchBoot.stereotype as stereotype
-from PytorchBoot.utils.log_util import Log
-import PytorchBoot.namespace as namespace
-from PytorchBoot.status import status_manager
-
-from utils.control_util import ControlUtil
-from utils.communicate_util import CommunicateUtil
-from utils.pts_util import PtsUtil
-from utils.view_sample_util import ViewSampleUtil
-from utils.reconstruction_util import ReconstructionUtil
-
-
-@stereotype.runner("inferencer")
-class Inferencer(Runner):
-
-    def __init__(self, config_path: str):
-        super().__init__(config_path)
-        self.load_experiment("inferencer")
-        self.reconstruct_config = ConfigManager.get("runner", "reconstruct")
-        self.voxel_size = self.reconstruct_config["voxel_size"]
-        self.max_iter = self.reconstruct_config["max_iter"]
-        
-    def create_experiment(self, backup_name=None):
-        super().create_experiment(backup_name)
-    
-    def load_experiment(self, backup_name=None):
-        super().load_experiment(backup_name)
-        
-    def run_inference(self, model_name):
-        
-        ''' init robot '''
-        ControlUtil.init()
-        ''' take first view '''
-        view_data = CommunicateUtil.get_view_data()
-        first_cam_pts = None
-        first_cam_pose = None
-        combined_pts = first_cam_pts
-        input_data = {
-            "scanned_target_points_num": [first_cam_pts.shape[0]],
-            "scanned_n_to_world_pose_9d": [first_cam_pose],
-            "combined_scanned_pts": combined_pts
-        }
-        ''' enter loop '''
-        iter = 0
-        while True:
-            ''' inference '''
-            inference_result = CommunicateUtil.get_inference_data(input_data)
-            cam_to_world = inference_result["cam_to_world"]
-            ''' set pose '''
-            ControlUtil.set_pose(cam_to_world)
-            ''' take view '''
-            view_data = CommunicateUtil.get_view_data()
-            curr_cam_pts = None
-            curr_cam_pose = None
-            ''' update combined pts '''
-            combined_pts = np.concatenate([combined_pts, curr_cam_pts], axis=0)
-            combined_pts = PtsUtil.voxel_downsample_point_cloud(combined_pts, voxel_size=self.voxel_size)
-            ''' update input data '''
-            input_data["combined_scanned_pts"] = combined_pts
-            input_data["scanned_target_points_num"].append(curr_cam_pts.shape[0])
-            input_data["scanned_n_to_world_pose_9d"].append(curr_cam_pose)
-            
-            ''' check stop condition '''
-            if iter >= self.max_iter:
-                break
-            
-    
-    def run(self):
-        self.run_inference()
-            
-    
-if __name__ == "__main__":
-    model_path = "/home/yan20/nbv_rec/data/test_CAD/test_model/bear_scaled.ply"
-    model = trimesh.load(model_path)
-    test_pts_L = np.loadtxt("/home/yan20/nbv_rec/data/test_CAD/cam_pts_0_L.txt")
-    test_pts_R = np.loadtxt("/home/yan20/nbv_rec/data/test_CAD/cam_pts_0_R.txt")
-    cam_to_world_L = PtsUtil.register_icp(test_pts_L, model)
-    cam_to_world_R = PtsUtil.register_icp(test_pts_R, model)
-    print(cam_to_world_L)
-    print("================================")
-    print(cam_to_world_R)
-    
--- a/runners/renderer.py
+++ b/runners/renderer.py
@@ -1,127 +0,0 @@
-import os
-import trimesh
-import numpy as np
-from PytorchBoot.runners.runner import Runner
-from PytorchBoot.config import ConfigManager
-import PytorchBoot.stereotype as stereotype
-from PytorchBoot.utils.log_util import Log
-from PytorchBoot.status import status_manager
-
-#from utils.control_util import ControlUtil
-from utils.communicate_util import CommunicateUtil
-from utils.pts_util import PtsUtil
-from utils.view_sample_util import ViewSampleUtil
-from utils.reconstruction_util import ReconstructionUtil
-
-
-@stereotype.runner("online_renderer")
-class OnlineRenderer(Runner):
-
-    def __init__(self, config_path: str):
-        super().__init__(config_path)
-        self.load_experiment("cad_strategy")
-        self.host = ConfigManager.get("runner", "web", "host")
-        self.port = ConfigManager.get("runner", "web", "port")
-        
-    def create_experiment(self, backup_name=None):
-        super().create_experiment(backup_name)
-    
-    def load_experiment(self, backup_name=None):
-        super().load_experiment(backup_name)
-        
-    def run_one_model(self, model_name):
-        
-        ''' init robot '''
-        ControlUtil.init()
-        ''' load CAD model '''
-        model_path = os.path.join(self.model_dir, model_name)
-        cad_model = trimesh.load(model_path)
-        ''' take first view '''
-        view_data = CommunicateUtil.get_view_data()
-        first_cam_pts = None
-        ''' register '''
-        cad_to_cam = PtsUtil.register(first_cam_pts, cad_model)
-        cam_to_world = ControlUtil.get_pose()
-        cad_to_world = cam_to_world @ cad_to_cam
-        cad_model:trimesh.Trimesh = cad_model.apply_transform(cad_to_world)
-        ''' sample view '''
-        min_corner = cad_model.bounds[0]
-        max_corner = cad_model.bounds[1] 
-        diag = np.linalg.norm(max_corner - min_corner)
-        view_num = int(self.min_view + (diag - self.min_diag)/(self.max_diag - self.min_diag) * (self.max_view - self.min_view))
-        sampled_view_data = ViewSampleUtil.sample_view_data_world_space(
-            cad_model, cad_to_world,  
-            voxel_size = self.voxel_size,
-            max_views = view_num,
-            min_cam_table_included_degree= self.min_cam_table_included_degree,
-            random_view_ratio = self.random_view_ratio
-        )
-        cam_to_world_poses = sampled_view_data["cam_to_world_poses"]
-        world_model_points = sampled_view_data["voxel_down_sampled_points"]
-
-        ''' take sample view '''
-        scan_points_idx_list = []
-        sample_view_pts_list = []
-        for cam_to_world in cam_to_world_poses:
-            ControlUtil.move_to(cam_to_world)
-            ''' get world pts '''
-            view_data = CommunicateUtil.get_view_data()
-            cam_pts = None
-            scan_points_idx = None
-            world_pts = PtsUtil.transform_point_cloud(cam_pts, cam_to_world)
-            sample_view_pts_list.append(world_pts)
-            scan_points_idx_list.append(scan_points_idx)
-            
-        ''' generate strategy '''
-        scan_points = ReconstructionUtil.generate_scan_points(display_table_top=0, display_table_radius=0.25)
-        
-        limited_useful_view, _, _ = ReconstructionUtil.compute_next_best_view_sequence_with_overlap(
-            world_model_points, sample_view_pts_list, 
-            scan_points_indices_list = scan_points_idx_list,
-            init_view=0,
-            threshold=self.voxel_size, 
-            soft_overlap_threshold = self.soft_overlap_threshold,
-            hard_overlap_threshold = self.hard_overlap_threshold,
-            scan_points_threshold = self.scan_points_threshold, 
-            status_info=self.status_info
-        )
-        
-        ''' extract cam_to_world sequence  '''
-        cam_to_world_seq = []
-        coveraget_rate_seq = []
-        
-        for idx, coverage_rate in limited_useful_view:
-            cam_to_world_seq.append(cam_to_world_poses[idx])
-            coveraget_rate_seq.append(coverage_rate)
-            
-        ''' take best seq view '''
-        for cam_to_world in cam_to_world_seq:
-            ControlUtil.move_to(cam_to_world)
-            ''' get world pts '''
-            view_data = CommunicateUtil.get_view_data()
-            cam_pts = None
-            scan_points_idx = None
-            world_pts = PtsUtil.transform_point_cloud(cam_pts, cam_to_world)
-            sample_view_pts_list.append(world_pts)
-            scan_points_idx_list.append(scan_points_idx)
-        
-    
-    def run(self):
-        total = len(os.listdir(self.model_dir))
-        model_start_idx = self.generate_config["model_start_idx"]
-        count_object = model_start_idx
-        for model_name in os.listdir(self.model_dir[model_start_idx:]):
-            Log.info(f"[{count_object}/{total}]Processing {model_name}")
-            self.run_one_model(model_name)
-            Log.success(f"[{count_object}/{total}]Finished processing {model_name}")
-        
-            
-# ---------------------------- test ---------------------------- #
-if __name__ == "__main__":
-    
-    model_path = r"C:\Users\hofee\Downloads\mesh.obj"
-    model = trimesh.load(model_path)
-    
-
-    
-    
--- a/utils/communicate_util.py
+++ b/utils/communicate_util.py
@@ -1,13 +1,35 @@
+import requests
+import numpy as np

 class CommunicateUtil:
-    VIEW_HOST = "127.0.0.1:5000"
-    INFERENCE_HOST = "127.0.0.1:5000"
+    VIEW_HOST = "192.168.1.2:7999"  #"10.7.250.52:7999" ##
+    INFERENCE_HOST = "127.0.0.1"
+    INFERENCE_PORT = 5000
    
-    def get_view_data() -> dict:
-        data = {}
-        return data
+    def get_view_data(init = False) -> dict:
+        params = {}
+        params["create_scanner"] = init
+        response = requests.get(f"http://{CommunicateUtil.VIEW_HOST}/api/data", json=params)
+        data = response.json()
+        
+        if not data["success"]:
+            print(f"Failed to get view data")
+            return None
+        
+        image_id = data["image_id"]
+        depth_image = np.array(data["depth_image"], dtype=np.uint16)
+        depth_intrinsics = data["depth_intrinsics"]
+        depth_extrinsics = np.array(data["depth_extrinsics"])
+        view_data = {
+            "image_id": image_id,
+            "depth_image": depth_image,
+            "depth_intrinsics": depth_intrinsics,
+            "depth_extrinsics": depth_extrinsics
+        }
+        return view_data
    
    def get_inference_data(view_data:dict) -> dict:
        data = {}
        return data
+        
        
--- a/utils/control_util.py
+++ b/utils/control_util.py
@@ -1,41 +1,51 @@
 import numpy as np
 from frankapy import FrankaArm
 from autolab_core import RigidTransform
+import serial
+import time

 class ControlUtil:
    
-    __fa = FrankaArm(robot_num=2)
+    __fa:FrankaArm = None
+    __ser: serial.Serial = None
+    curr_rotation = 0
    
    BASE_TO_WORLD:np.ndarray = np.asarray([
-        [1, 0, 0, -0.5],
-        [0, 1, 0, 0],
-        [0, 0, 1, -0.2],
+        [1, 0, 0, -0.61091665],
+        [0, 1, 0, -0.00309726],
+        [0, 0, 1, -0.1136743],
        [0, 0, 0, 1]
        ])
    
    CAMERA_TO_GRIPPER:np.ndarray = np.asarray([
+        [0, -1, 0, 0.01],
        [1, 0, 0, 0],
-        [0, 1, 0, 0],
-        [0, 0, 1, 0],
+        [0, 0, 1, 0.08],
        [0, 0, 0, 1]
        ])
-    theta = np.radians(25)
-    INIT_POSE:np.ndarray = np.asarray([
-        [np.cos(theta), 0, -np.sin(theta), 0],
-        [0, -1, 0, 0],
-        [-np.sin(theta), 0, -np.cos(theta), 0.35],
-        [0, 0, 0, 1]
+    INIT_GRIPPER_POSE:np.ndarray = np.asarray([
+        [ 0.46532393,  0.62171798,  0.63002284,  0.21230963],
+        [ 0.43205618, -0.78075723,  0.45136491, -0.25127173],
+        [ 0.77251656,  0.06217437, -0.63193429,  0.499957  ],
+        [ 0.        ,  0.        ,  0.        ,  1.        ],
        ])
+
    
-    AXIS_THRESHOLD = (-(np.pi+5e-2)/2, (np.pi+5e-2)/2)
-    
+    @staticmethod
+    def connect_robot():
+        if ControlUtil.__fa is None:
+            ControlUtil.__fa = FrankaArm(robot_num=2)
+        if ControlUtil.__ser is None:
+            ControlUtil.__ser = serial.Serial(port="/dev/ttyUSB0", baudrate=115200) 
+        
    @staticmethod
    def franka_reset() -> None:
        ControlUtil.__fa.reset_joints()
        
    @staticmethod
    def init() -> None:
-        ControlUtil.set_pose(ControlUtil.INIT_POSE)
+        ControlUtil.franka_reset()
+        ControlUtil.set_gripper_pose(ControlUtil.INIT_GRIPPER_POSE)
        
    @staticmethod
    def get_pose() -> np.ndarray:
@@ -46,17 +56,35 @@ class ControlUtil:
    @staticmethod
    def set_pose(cam_to_world: np.ndarray) -> None:
        gripper_to_base = ControlUtil.solve_gripper_to_base(cam_to_world)
-        gripper_to_base = RigidTransform(rotation=gripper_to_base[:3, :3], translation=gripper_to_base[:3, 3], from_frame="franka_tool", to_frame="world")
-        ControlUtil.__fa.goto_pose(gripper_to_base, use_impedance=False, ignore_errors=False)
+        ControlUtil.set_gripper_pose(gripper_to_base)
        
    @staticmethod
    def rotate_display_table(degree):
-        pass
+        turn_directions = {
+            "left": 1,
+            "right": 0
+        }
+        delta_degree = degree - ControlUtil.curr_rotation
+        ControlUtil.curr_rotation += delta_degree
+        print(f"Table rotated {ControlUtil.cnt_rotation} degree")
+        if degree >= 0:
+            turn_angle = delta_degree
+            turn_direction = turn_directions["right"]
+        else:
+            turn_angle = -delta_degree
+            turn_direction = turn_directions["left"]
+        write_len = ControlUtil.__ser.write(f"CT+TRUNSINGLE({turn_direction},{turn_angle});".encode('utf-8'))
+        
    
    @staticmethod
    def get_curr_gripper_to_base_pose() -> np.ndarray:
        return ControlUtil.__fa.get_pose().matrix
    
+    @staticmethod
+    def set_gripper_pose(gripper_to_base: np.ndarray) -> None:
+        gripper_to_base = RigidTransform(rotation=gripper_to_base[:3, :3], translation=gripper_to_base[:3, 3], from_frame="franka_tool", to_frame="world")
+        ControlUtil.__fa.goto_pose(gripper_to_base, duration=5, use_impedance=False, ignore_errors=False)
+        
    @staticmethod
    def solve_gripper_to_base(cam_to_world: np.ndarray) -> np.ndarray:
        return np.linalg.inv(ControlUtil.BASE_TO_WORLD) @ cam_to_world @ np.linalg.inv(ControlUtil.CAMERA_TO_GRIPPER)
@@ -66,24 +94,38 @@ class ControlUtil:
        return ControlUtil.BASE_TO_WORLD @ gripper_to_base @ ControlUtil.CAMERA_TO_GRIPPER
    
    @staticmethod
-    def solve_display_table_rot_and_cam_to_world(cam_to_world: np.ndarray) -> tuple:
-        gripper_to_base = ControlUtil.solve_gripper_to_base(cam_to_world)
-        gripper_to_base_axis_angle = ControlUtil.get_gripper_to_base_axis_angle(gripper_to_base)
+    def check_limit(new_cam_to_world):
+        if new_cam_to_world[0,3] > 0 or new_cam_to_world[1,3] > 0:
+            return False
+        x = abs(new_cam_to_world[0,3])
+        y = abs(new_cam_to_world[1,3])
        
-        if ControlUtil.AXIS_THRESHOLD[0] <= gripper_to_base_axis_angle <= ControlUtil.AXIS_THRESHOLD[1]:
+        tan_y_x = y/x
+        if tan_y_x < np.sqrt(3)/3 or tan_y_x > np.sqrt(3):
+            return False
+         
+        return True
+    
+    @staticmethod
+    def solve_display_table_rot_and_cam_to_world(cam_to_world: np.ndarray) -> tuple:   
+        if ControlUtil.check_limit(cam_to_world):
            return 0, cam_to_world
        else:
-            for display_table_rot in np.linspace(0.1,180, 1800):
+            min_display_table_rot = 180
+            min_new_cam_to_world = None
+            for display_table_rot in np.linspace(0.1,360, 1800):
                display_table_rot_z_pose = ControlUtil.get_z_axis_rot_mat(display_table_rot)
-                new_cam_to_world = display_table_rot_z_pose @ cam_to_world
-                if ControlUtil.AXIS_THRESHOLD[0] <= ControlUtil.get_gripper_to_base_axis_angle(new_cam_to_world) <= ControlUtil.AXIS_THRESHOLD[1]:
-                    return -display_table_rot, new_cam_to_world
-                
-                display_table_rot = -display_table_rot
-                display_table_rot_z_pose = ControlUtil.get_z_axis_rot_mat(display_table_rot)
-                new_cam_to_world = display_table_rot_z_pose @ cam_to_world
-                if ControlUtil.AXIS_THRESHOLD[0] <= ControlUtil.get_gripper_to_base_axis_angle(new_cam_to_world) <= ControlUtil.AXIS_THRESHOLD[1]:
-                    return -display_table_rot, new_cam_to_world
+                new_cam_to_world = np.linalg.inv(display_table_rot_z_pose) @ cam_to_world
+                if ControlUtil.check_limit(new_cam_to_world):
+                    if display_table_rot < min_display_table_rot:
+                        min_display_table_rot, min_new_cam_to_world = display_table_rot, new_cam_to_world
+                    if abs(display_table_rot - 360) < min_display_table_rot:
+                        min_display_table_rot, min_new_cam_to_world = display_table_rot - 360, new_cam_to_world
+        
+        if min_new_cam_to_world is None:
+            raise ValueError("No valid display table rotation found")
+        
+        return min_display_table_rot, min_new_cam_to_world
                
    @staticmethod
    def get_z_axis_rot_mat(degree):
@@ -106,36 +148,80 @@ class ControlUtil:
    @staticmethod
    def move_to(pose: np.ndarray):
        rot_degree, cam_to_world = ControlUtil.solve_display_table_rot_and_cam_to_world(pose)
-        print("table rot degree:", rot_degree)
+        exec_time = abs(rot_degree)/9
+        start_time = time.time()
        ControlUtil.rotate_display_table(rot_degree)
        ControlUtil.set_pose(cam_to_world)
-        
-        
+        end_time = time.time()
+        print(f"Move to pose with rotation {rot_degree} degree, exec time: {end_time - start_time}|exec time: {exec_time}")
+        if end_time - start_time < exec_time:
+            time.sleep(exec_time - (end_time - start_time))
+            
 # ----------- Debug Test -------------

 if __name__ == "__main__":
+    ControlUtil.connect_robot()
+    # ControlUtil.franka_reset()
+    def main_test():
+        print(ControlUtil.get_curr_gripper_to_base_pose())
+        ControlUtil.init()
+    
+    def rotate_back(rotation):
+        ControlUtil.rotate_display_table(-rotation)
+    
+    #main_test()
+    import sys; sys.path.append("/home/yan20/nbv_rec/project/franka_control")
+    from utils.communicate_util import CommunicateUtil
+    import ipdb
    ControlUtil.init()
-    import time
-    start = time.time()
-    rot_degree, cam_to_world = ControlUtil.solve_display_table_rot_and_cam_to_world(ControlUtil.INIT_POSE)
-    end = time.time()
-    print(f"Time: {end-start}")
-    print(rot_degree, cam_to_world)
-    # test_pose = np.asarray([
-    #      [1, 0, 0, 0.4],
-    #     [0, -1, 0, 0],
-    #     [0, 0, -1, 0.6],
-    #     [0, 0, 0, 1]
-    #      ])
-    # ControlUtil.set_pose(test_pose)
-    # print(ControlUtil.get_pose())
-    # ControlUtil.reset()
-    # print(ControlUtil.get_pose())
+    view_data_0 = CommunicateUtil.get_view_data(init=True)
+    depth_extrinsics_0 = view_data_0["depth_extrinsics"]
+    cam_to_world_0 = ControlUtil.get_pose()
+    print("cam_extrinsics_0")
+    print(depth_extrinsics_0)
+    print("cam_to_world_0")
+    print(cam_to_world_0)
    
-    angle = ControlUtil.get_gripper_to_base_axis_angle(ControlUtil.solve_gripper_to_base(cam_to_world))
-    threshold = ControlUtil.AXIS_THRESHOLD
+    ipdb.set_trace()
+    TEST_POSE:np.ndarray = np.asarray([
+        [ 0.46532393,  0.62171798,  0.63002284,  0.30230963],
+        [ 0.43205618, -0.78075723,  0.45136491, -0.29127173],
+        [ 0.77251656,  0.06217437, -0.63193429,  0.559957  ],
+        [ 0.        ,  0.        ,  0.        ,  1.        ],
+        ])
+    TEST_POSE_CAM_TO_WORLD = ControlUtil.BASE_TO_WORLD @ TEST_POSE @ ControlUtil.CAMERA_TO_GRIPPER
+    ControlUtil.move_to(TEST_POSE_CAM_TO_WORLD)
+    view_data_1 = CommunicateUtil.get_view_data()
+    depth_extrinsics_1 = view_data_1["depth_extrinsics"]
+    depth_extrinsics_1[:3,3] = depth_extrinsics_1[:3,3] / 1000
+    cam_to_world_1 = ControlUtil.get_pose()
+    print("cam_extrinsics_1")
+    print(depth_extrinsics_1)
+    print("cam_to_world_1")
+    print(TEST_POSE_CAM_TO_WORLD)
+    actual_cam_to_world_1 = cam_to_world_0 @ depth_extrinsics_1
+    print("actual_cam_to_world_1")
+    print(actual_cam_to_world_1)
+    ipdb.set_trace()
+    TEST_POSE_2:np.ndarray = np.asarray(
+        [[ 0.74398544, -0.61922696,  0.251049,    0.47000935],
+        [-0.47287207, -0.75338888, -0.45692666,  0.20843903],
+        [ 0.47207883 , 0.22123272, -0.85334192,  0.57863381],
+        [ 0. ,         0.   ,       0.  ,        1.  ,      ]]
+        )
+    TEST_POSE_CAM_TO_WORLD_2 = ControlUtil.BASE_TO_WORLD @ TEST_POSE_2 @ ControlUtil.CAMERA_TO_GRIPPER
    
-    angle_degree = np.degrees(angle)
-    threshold_degree = np.degrees(threshold[0]), np.degrees(threshold[1])
-    print(f"Angle: {angle_degree}, range: {threshold_degree}")
-    ControlUtil.set_pose(cam_to_world)
+    #ControlUtil.move_to(TEST_POSE_CAM_TO_WORLD_2)
+    ControlUtil.set_pose(TEST_POSE_CAM_TO_WORLD_2)
+    view_data_2 = CommunicateUtil.get_view_data()
+    depth_extrinsics_2 = view_data_2["depth_extrinsics"]
+    depth_extrinsics_2[:3,3] = depth_extrinsics_2[:3,3] / 1000
+    cam_to_world_2 = ControlUtil.get_pose()
+    print("cam_extrinsics_2")
+    print(depth_extrinsics_2)
+    print("cam_to_world_2")
+    print(TEST_POSE_CAM_TO_WORLD_2)
+    actual_cam_to_world_2 = cam_to_world_0 @ depth_extrinsics_2
+    print("actual_cam_to_world_2")
+    print(actual_cam_to_world_2)
+    ipdb.set_trace()
--- a/utils/data_load.py
+++ b/utils/data_load.py
@@ -0,0 +1,410 @@
+import os
+import numpy as np
+import json
+import cv2
+import trimesh
+import torch
+from utils.pts_util import PtsUtil
+
+
+class DataLoadUtil:
+    TABLE_POSITION = np.asarray([0, 0, 0.8215])
+
+    @staticmethod
+    def get_display_table_info(root, scene_name):
+        scene_info = DataLoadUtil.load_scene_info(root, scene_name)
+        display_table_info = scene_info["display_table"]
+        return display_table_info
+
+    @staticmethod
+    def get_display_table_top(root, scene_name):
+        display_table_height = DataLoadUtil.get_display_table_info(root, scene_name)[
+            "height"
+        ]
+        display_table_top = DataLoadUtil.TABLE_POSITION + np.asarray(
+            [0, 0, display_table_height]
+        )
+        return display_table_top
+
+    @staticmethod
+    def get_path(root, scene_name, frame_idx):
+        path = os.path.join(root, scene_name, f"{frame_idx}")
+        return path
+
+    @staticmethod
+    def get_label_num(root, scene_name):
+        label_dir = os.path.join(root, scene_name, "label")
+        return len(os.listdir(label_dir))
+
+    @staticmethod
+    def get_label_path(root, scene_name, seq_idx):
+        label_dir = os.path.join(root, scene_name, "label")
+        if not os.path.exists(label_dir):
+            os.makedirs(label_dir)
+        path = os.path.join(label_dir, f"{seq_idx}.json")
+        return path
+
+    @staticmethod
+    def get_label_path_old(root, scene_name):
+        path = os.path.join(root, scene_name, "label.json")
+        return path
+
+    @staticmethod
+    def get_scene_seq_length(root, scene_name):
+        camera_params_path = os.path.join(root, scene_name, "camera_params")
+        return len(os.listdir(camera_params_path))
+
+    @staticmethod
+    def load_mesh_at(model_dir, object_name, world_object_pose):
+        model_path = os.path.join(model_dir, object_name, "mesh.obj")
+        mesh = trimesh.load(model_path)
+        mesh.apply_transform(world_object_pose)
+        return mesh
+
+    @staticmethod
+    def get_bbox_diag(model_dir, object_name):
+        model_path = os.path.join(model_dir, object_name, "mesh.obj")
+        mesh = trimesh.load(model_path)
+        bbox = mesh.bounding_box.extents
+        diagonal_length = np.linalg.norm(bbox)
+        return diagonal_length
+
+    @staticmethod
+    def save_mesh_at(model_dir, output_dir, object_name, scene_name, world_object_pose):
+        mesh = DataLoadUtil.load_mesh_at(model_dir, object_name, world_object_pose)
+        model_path = os.path.join(output_dir, scene_name, "world_mesh.obj")
+        mesh.export(model_path)
+
+    @staticmethod
+    def save_target_mesh_at_world_space(
+        root, model_dir, scene_name, display_table_as_world_space_origin=True
+    ):
+        scene_info = DataLoadUtil.load_scene_info(root, scene_name)
+        target_name = scene_info["target_name"]
+        transformation = scene_info[target_name]
+        if display_table_as_world_space_origin:
+            location = transformation["location"] - DataLoadUtil.get_display_table_top(
+                root, scene_name
+            )
+        else:
+            location = transformation["location"]
+        rotation_euler = transformation["rotation_euler"]
+        pose_mat = trimesh.transformations.euler_matrix(*rotation_euler)
+        pose_mat[:3, 3] = location
+
+        mesh = DataLoadUtil.load_mesh_at(model_dir, target_name, pose_mat)
+        mesh_dir = os.path.join(root, scene_name, "mesh")
+        if not os.path.exists(mesh_dir):
+            os.makedirs(mesh_dir)
+        model_path = os.path.join(mesh_dir, "world_target_mesh.obj")
+        mesh.export(model_path)
+
+    @staticmethod
+    def load_scene_info(root, scene_name):
+        scene_info_path = os.path.join(root, scene_name, "scene_info.json")
+        with open(scene_info_path, "r") as f:
+            scene_info = json.load(f)
+        return scene_info
+
+    @staticmethod
+    def load_target_pts_num_dict(root, scene_name):
+        target_pts_num_path = os.path.join(root, scene_name, "target_pts_num.json")
+        with open(target_pts_num_path, "r") as f:
+            target_pts_num_dict = json.load(f)
+        return target_pts_num_dict
+
+    @staticmethod
+    def load_target_object_pose(root, scene_name):
+        scene_info = DataLoadUtil.load_scene_info(root, scene_name)
+        target_name = scene_info["target_name"]
+        transformation = scene_info[target_name]
+        location = transformation["location"]
+        rotation_euler = transformation["rotation_euler"]
+        pose_mat = trimesh.transformations.euler_matrix(*rotation_euler)
+        pose_mat[:3, 3] = location
+        return pose_mat
+
+    @staticmethod
+    def load_depth(path, min_depth=0.01, max_depth=5.0, binocular=False):
+
+        def load_depth_from_real_path(real_path, min_depth, max_depth):
+            depth = cv2.imread(real_path, cv2.IMREAD_UNCHANGED)
+            depth = depth.astype(np.float32) / 65535.0
+            min_depth = min_depth
+            max_depth = max_depth
+            depth_meters = min_depth + (max_depth - min_depth) * depth
+            return depth_meters
+
+        if binocular:
+            depth_path_L = os.path.join(
+                os.path.dirname(path), "depth", os.path.basename(path) + "_L.png"
+            )
+            depth_path_R = os.path.join(
+                os.path.dirname(path), "depth", os.path.basename(path) + "_R.png"
+            )
+            depth_meters_L = load_depth_from_real_path(
+                depth_path_L, min_depth, max_depth
+            )
+            depth_meters_R = load_depth_from_real_path(
+                depth_path_R, min_depth, max_depth
+            )
+            return depth_meters_L, depth_meters_R
+        else:
+            depth_path = os.path.join(
+                os.path.dirname(path), "depth", os.path.basename(path) + ".png"
+            )
+            depth_meters = load_depth_from_real_path(depth_path, min_depth, max_depth)
+            return depth_meters
+
+    @staticmethod
+    def load_seg(path, binocular=False, left_only=False):
+        if binocular and not left_only:
+
+            def clean_mask(mask_image):
+                green = [0, 255, 0, 255]
+                red = [255, 0, 0, 255]
+                threshold = 2
+                mask_image = np.where(
+                    np.abs(mask_image - green) <= threshold, green, mask_image
+                )
+                mask_image = np.where(
+                    np.abs(mask_image - red) <= threshold, red, mask_image
+                )
+                return mask_image
+
+            mask_path_L = os.path.join(
+                os.path.dirname(path), "mask", os.path.basename(path) + "_L.png"
+            )
+            mask_image_L = clean_mask(cv2.imread(mask_path_L, cv2.IMREAD_UNCHANGED))
+            mask_path_R = os.path.join(
+                os.path.dirname(path), "mask", os.path.basename(path) + "_R.png"
+            )
+            mask_image_R = clean_mask(cv2.imread(mask_path_R, cv2.IMREAD_UNCHANGED))
+            return mask_image_L, mask_image_R
+        else:
+            if binocular and left_only:
+                mask_path = os.path.join(
+                    os.path.dirname(path), "mask", os.path.basename(path) + "_L.png"
+                )
+            else:
+                mask_path = os.path.join(
+                    os.path.dirname(path), "mask", os.path.basename(path) + ".png"
+                )
+            mask_image = cv2.imread(mask_path, cv2.IMREAD_UNCHANGED)
+            return mask_image
+        
+    @staticmethod
+    def load_normal(path, binocular=False, left_only=False):
+        if binocular and not left_only:
+            normal_path_L = os.path.join(
+                os.path.dirname(path), "normal", os.path.basename(path) + "_L.png"
+            )
+            normal_image_L = cv2.imread(normal_path_L, cv2.IMREAD_COLOR)
+            normal_path_R = os.path.join(
+                os.path.dirname(path), "normal", os.path.basename(path) + "_R.png"
+            )
+            normal_image_R = cv2.imread(normal_path_R, cv2.IMREAD_COLOR)
+            normalized_normal_image_L = normal_image_L / 255.0 * 2.0 - 1.0
+            normalized_normal_image_R = normal_image_R / 255.0 * 2.0 - 1.0
+            return normalized_normal_image_L, normalized_normal_image_R
+        else:
+            if binocular and left_only:
+                normal_path = os.path.join(
+                    os.path.dirname(path), "normal", os.path.basename(path) + "_L.png"
+                )
+            else:
+                normal_path = os.path.join(
+                    os.path.dirname(path), "normal", os.path.basename(path) + ".png"
+                )
+            normal_image = cv2.imread(normal_path, cv2.IMREAD_COLOR)
+            normalized_normal_image = normal_image / 255.0 * 2.0 - 1.0
+            return normalized_normal_image
+
+    @staticmethod
+    def load_label(path):
+        with open(path, "r") as f:
+            label_data = json.load(f)
+        return label_data
+
+    @staticmethod
+    def load_rgb(path):
+        rgb_path = os.path.join(
+            os.path.dirname(path), "rgb", os.path.basename(path) + ".png"
+        )
+        rgb_image = cv2.imread(rgb_path, cv2.IMREAD_COLOR)
+        return rgb_image
+
+    @staticmethod
+    def load_from_preprocessed_pts(path):
+        npy_path = os.path.join(
+            os.path.dirname(path), "pts", os.path.basename(path) + ".npy"
+        )
+        pts = np.load(npy_path)
+        return pts
+
+    @staticmethod
+    def cam_pose_transformation(cam_pose_before):
+        offset = np.asarray([[1, 0, 0, 0], [0, -1, 0, 0], [0, 0, -1, 0], [0, 0, 0, 1]])
+        cam_pose_after = cam_pose_before @ offset
+        return cam_pose_after
+
+    @staticmethod
+    def load_cam_info(path, binocular=False, display_table_as_world_space_origin=True):
+        scene_dir = os.path.dirname(path)
+        root_dir = os.path.dirname(scene_dir)
+        scene_name = os.path.basename(scene_dir)
+        camera_params_path = os.path.join(
+            os.path.dirname(path), "camera_params", os.path.basename(path) + ".json"
+        )
+        with open(camera_params_path, "r") as f:
+            label_data = json.load(f)
+        cam_to_world = np.asarray(label_data["extrinsic"])
+        cam_to_world = DataLoadUtil.cam_pose_transformation(cam_to_world)
+        world_to_display_table = np.eye(4)
+        world_to_display_table[:3, 3] = -DataLoadUtil.get_display_table_top(
+            root_dir, scene_name
+        )
+        if display_table_as_world_space_origin:
+            cam_to_world = np.dot(world_to_display_table, cam_to_world)
+        cam_intrinsic = np.asarray(label_data["intrinsic"])
+        cam_info = {
+            "cam_to_world": cam_to_world,
+            "cam_intrinsic": cam_intrinsic,
+            "far_plane": label_data["far_plane"],
+            "near_plane": label_data["near_plane"],
+        }
+        if binocular:
+            cam_to_world_R = np.asarray(label_data["extrinsic_R"])
+            cam_to_world_R = DataLoadUtil.cam_pose_transformation(cam_to_world_R)
+            cam_to_world_O = np.asarray(label_data["extrinsic_cam_object"])
+            cam_to_world_O = DataLoadUtil.cam_pose_transformation(cam_to_world_O)
+            if display_table_as_world_space_origin:
+                cam_to_world_O = np.dot(world_to_display_table, cam_to_world_O)
+                cam_to_world_R = np.dot(world_to_display_table, cam_to_world_R)
+            cam_info["cam_to_world_O"] = cam_to_world_O
+            cam_info["cam_to_world_R"] = cam_to_world_R
+        return cam_info
+
+    @staticmethod
+    def get_real_cam_O_from_cam_L(
+        cam_L, cam_O_to_cam_L, scene_path, display_table_as_world_space_origin=True
+    ):
+        root_dir = os.path.dirname(scene_path)
+        scene_name = os.path.basename(scene_path)
+        if isinstance(cam_L, torch.Tensor):
+            cam_L = cam_L.cpu().numpy()
+        nO_to_display_table_pose = cam_L @ cam_O_to_cam_L
+        if display_table_as_world_space_origin:
+            display_table_to_world = np.eye(4)
+            display_table_to_world[:3, 3] = DataLoadUtil.get_display_table_top(
+                root_dir, scene_name
+            )
+            nO_to_world_pose = np.dot(display_table_to_world, nO_to_display_table_pose)
+        nO_to_world_pose = DataLoadUtil.cam_pose_transformation(nO_to_world_pose)
+        return nO_to_world_pose
+
+    @staticmethod
+    def get_target_point_cloud(
+        depth, cam_intrinsic, cam_extrinsic, mask, target_mask_label=(0, 255, 0, 255), require_full_points=False
+    ):
+        h, w = depth.shape
+        i, j = np.meshgrid(np.arange(w), np.arange(h), indexing="xy")
+
+        z = depth
+        x = (i - cam_intrinsic[0, 2]) * z / cam_intrinsic[0, 0]
+        y = (j - cam_intrinsic[1, 2]) * z / cam_intrinsic[1, 1]
+
+        points_camera = np.stack((x, y, z), axis=-1).reshape(-1, 3)
+        mask = mask.reshape(-1, 4)
+
+        target_mask = (mask == target_mask_label).all(axis=-1)
+
+        target_points_camera = points_camera[target_mask]
+        target_points_camera_aug = np.concatenate(
+            [target_points_camera, np.ones((target_points_camera.shape[0], 1))], axis=-1
+        )
+
+        target_points_world = np.dot(cam_extrinsic, target_points_camera_aug.T).T[:, :3]
+        data = {
+            "points_world": target_points_world,
+            "points_camera": target_points_camera,
+        }
+        return data
+
+    @staticmethod
+    def get_point_cloud(depth, cam_intrinsic, cam_extrinsic):
+        h, w = depth.shape
+        i, j = np.meshgrid(np.arange(w), np.arange(h), indexing="xy")
+
+        z = depth
+        x = (i - cam_intrinsic[0, 2]) * z / cam_intrinsic[0, 0]
+        y = (j - cam_intrinsic[1, 2]) * z / cam_intrinsic[1, 1]
+
+        points_camera = np.stack((x, y, z), axis=-1).reshape(-1, 3)
+        points_camera_aug = np.concatenate(
+            [points_camera, np.ones((points_camera.shape[0], 1))], axis=-1
+        )
+
+        points_world = np.dot(cam_extrinsic, points_camera_aug.T).T[:, :3]
+        return {"points_world": points_world, "points_camera": points_camera}
+
+    @staticmethod
+    def get_target_point_cloud_world_from_path(
+        path,
+        binocular=False,
+        random_downsample_N=65536,
+        voxel_size=0.005,
+        target_mask_label=(0, 255, 0, 255),
+        display_table_mask_label=(0, 0, 255, 255),
+        get_display_table_pts=False,
+        require_normal=False,
+    ):
+        cam_info = DataLoadUtil.load_cam_info(path, binocular=binocular)
+        if binocular:
+            depth_L, depth_R = DataLoadUtil.load_depth(
+                path, cam_info["near_plane"], cam_info["far_plane"], binocular=True
+            )
+            mask_L, mask_R = DataLoadUtil.load_seg(path, binocular=True)
+            point_cloud_L = DataLoadUtil.get_target_point_cloud(
+                depth_L,
+                cam_info["cam_intrinsic"],
+                cam_info["cam_to_world"],
+                mask_L,
+                target_mask_label,
+            )["points_world"]
+            point_cloud_R = DataLoadUtil.get_target_point_cloud(
+                depth_R,
+                cam_info["cam_intrinsic"],
+                cam_info["cam_to_world_R"],
+                mask_R,
+                target_mask_label,
+            )["points_world"]
+            point_cloud_L = PtsUtil.random_downsample_point_cloud(
+                point_cloud_L, random_downsample_N
+            )
+            point_cloud_R = PtsUtil.random_downsample_point_cloud(
+                point_cloud_R, random_downsample_N
+            )
+            overlap_points = PtsUtil.get_overlapping_points(
+                point_cloud_L, point_cloud_R, voxel_size
+            )
+            return overlap_points
+        else:
+            depth = DataLoadUtil.load_depth(
+                path, cam_info["near_plane"], cam_info["far_plane"]
+            )
+            mask = DataLoadUtil.load_seg(path)
+            point_cloud = DataLoadUtil.get_target_point_cloud(
+                depth, cam_info["cam_intrinsic"], cam_info["cam_to_world"], mask
+            )["points_world"]
+            return point_cloud
+
+    @staticmethod
+    def load_points_normals(root, scene_name, display_table_as_world_space_origin=True):
+        points_path = os.path.join(root, scene_name, "points_and_normals.txt")
+        points_normals = np.loadtxt(points_path)
+        if display_table_as_world_space_origin:
+            points_normals[:, :3] = points_normals[
+                :, :3
+            ] - DataLoadUtil.get_display_table_top(root, scene_name)
+        return points_normals
--- a/utils/preprocess_util.py
+++ b/utils/preprocess_util.py
@@ -0,0 +1,222 @@
+import os
+import numpy as np
+import time
+import sys
+np.random.seed(0)
+sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+from concurrent.futures import ThreadPoolExecutor, as_completed
+from utils.reconstruction_util import ReconstructionUtil
+from utils.data_load import DataLoadUtil
+from utils.pts_util import PtsUtil
+from PytorchBoot.utils.log_util import Log
+
+def save_np_pts(path, pts: np.ndarray, file_type="txt"):
+    if file_type == "txt":
+        np.savetxt(path, pts)
+    else:
+        np.save(path, pts)
+
+def save_target_points(root, scene, frame_idx, target_points: np.ndarray, file_type="txt"):
+    pts_path = os.path.join(root,scene, "pts", f"{frame_idx}.{file_type}")
+    if not os.path.exists(os.path.join(root,scene, "pts")):
+        os.makedirs(os.path.join(root,scene, "pts"))
+    save_np_pts(pts_path, target_points, file_type)
+    
+def save_scan_points_indices(root, scene, frame_idx, scan_points_indices: np.ndarray, file_type="txt"):
+    file_type="npy"
+    indices_path = os.path.join(root,scene, "scan_points_indices", f"{frame_idx}.{file_type}")
+    if not os.path.exists(os.path.join(root,scene, "scan_points_indices")):
+        os.makedirs(os.path.join(root,scene, "scan_points_indices"))
+    save_np_pts(indices_path, scan_points_indices, file_type)
+
+def save_scan_points(root, scene, scan_points: np.ndarray):
+    scan_points_path = os.path.join(root,scene, "scan_points.txt")
+    save_np_pts(scan_points_path, scan_points)
+
+def get_world_points(depth, mask, cam_intrinsic, cam_extrinsic, random_downsample_N):
+    z = depth[mask]
+    i, j = np.nonzero(mask)
+    x = (j - cam_intrinsic[0, 2]) * z / cam_intrinsic[0, 0]
+    y = (i - cam_intrinsic[1, 2]) * z / cam_intrinsic[1, 1]
+
+    points_camera = np.stack((x, y, z), axis=-1).reshape(-1, 3)
+    sampled_target_points = PtsUtil.random_downsample_point_cloud(
+                points_camera, random_downsample_N
+            )
+    points_camera_aug = np.concatenate((sampled_target_points, np.ones((sampled_target_points.shape[0], 1))), axis=-1)
+    points_camera_world = np.dot(cam_extrinsic, points_camera_aug.T).T[:, :3]
+    
+    return points_camera_world
+
+def get_scan_points_indices(scan_points, mask, display_table_mask_label, cam_intrinsic, cam_extrinsic):
+    scan_points_homogeneous = np.hstack((scan_points, np.ones((scan_points.shape[0], 1))))
+    points_camera = np.dot(np.linalg.inv(cam_extrinsic), scan_points_homogeneous.T).T[:, :3]
+    points_image_homogeneous = np.dot(cam_intrinsic, points_camera.T).T
+    points_image_homogeneous /= points_image_homogeneous[:, 2:]
+    pixel_x = points_image_homogeneous[:, 0].astype(int)
+    pixel_y = points_image_homogeneous[:, 1].astype(int)
+    h, w = mask.shape[:2]
+    valid_indices = (pixel_x >= 0) & (pixel_x < w) & (pixel_y >= 0) & (pixel_y < h)
+    mask_colors = mask[pixel_y[valid_indices], pixel_x[valid_indices]]
+    selected_points_indices = np.where((mask_colors == display_table_mask_label).all(axis=-1))[0]
+    selected_points_indices = np.where(valid_indices)[0][selected_points_indices]
+    return selected_points_indices
+
+def save_scene_data(root, scene, file_type="txt"):
+    
+    ''' configuration '''
+    target_mask_label = (0, 255, 0, 255)
+    display_table_mask_label=(0, 0, 255, 255)
+    random_downsample_N = 32768
+    voxel_size=0.002
+    filter_degree = 75
+    min_z = 0.25
+    max_z = 0.5
+    
+    ''' scan points '''
+    display_table_info = DataLoadUtil.get_display_table_info(root, scene)
+    radius = display_table_info["radius"]
+    
+    scan_points = np.asarray(ReconstructionUtil.generate_scan_points(display_table_top=0,display_table_radius=radius))
+    
+    ''' read frame data(depth|mask|normal) '''
+    frame_num = DataLoadUtil.get_scene_seq_length(root, scene)
+    for frame_id in range(frame_num):
+        Log.info(f"frame({frame_id}/{frame_num})]Processing {scene} frame {frame_id}")
+        path = DataLoadUtil.get_path(root, scene, frame_id)
+        cam_info = DataLoadUtil.load_cam_info(path, binocular=True)
+        depth_L, depth_R = DataLoadUtil.load_depth(
+                path, cam_info["near_plane"], 
+                cam_info["far_plane"], 
+                binocular=True
+            )
+        mask_L, mask_R = DataLoadUtil.load_seg(path, binocular=True)
+        
+        ''' target points '''
+        mask_img_L = mask_L
+        mask_img_R = mask_R
+
+        target_mask_img_L = (mask_L == target_mask_label).all(axis=-1)
+        target_mask_img_R = (mask_R == target_mask_label).all(axis=-1)
+
+        
+        sampled_target_points_L = get_world_points(depth_L, target_mask_img_L, cam_info["cam_intrinsic"], cam_info["cam_to_world"], random_downsample_N)
+        sampled_target_points_R = get_world_points(depth_R, target_mask_img_R, cam_info["cam_intrinsic"], cam_info["cam_to_world_R"], random_downsample_N)
+
+
+        has_points = sampled_target_points_L.shape[0] > 0 and sampled_target_points_R.shape[0] > 0
+        if has_points:
+            target_points = PtsUtil.get_overlapping_points(
+                    sampled_target_points_L, sampled_target_points_R, voxel_size
+                )
+
+        if has_points:
+            has_points = target_points.shape[0] > 0
+
+        if has_points:
+            points_normals = DataLoadUtil.load_points_normals(root, scene, display_table_as_world_space_origin=True)
+            target_points = PtsUtil.filter_points(
+                target_points, points_normals, cam_info["cam_to_world"],voxel_size=0.002, theta = filter_degree, z_range=(min_z, max_z)
+                )
+
+
+        ''' scan points indices '''
+        scan_points_indices_L = get_scan_points_indices(scan_points, mask_img_L, display_table_mask_label, cam_info["cam_intrinsic"], cam_info["cam_to_world"]) 
+        scan_points_indices_R = get_scan_points_indices(scan_points, mask_img_R, display_table_mask_label, cam_info["cam_intrinsic"], cam_info["cam_to_world_R"])
+        scan_points_indices = np.intersect1d(scan_points_indices_L, scan_points_indices_R)
+        
+        if not has_points:
+            target_points = np.zeros((0, 3))
+            
+        save_target_points(root, scene, frame_id, target_points, file_type=file_type)
+        save_scan_points_indices(root, scene, frame_id, scan_points_indices, file_type=file_type)
+    
+    save_scan_points(root, scene, scan_points) # The "done" flag of scene preprocess
+
+def process_frame(frame_id, root, scene, scan_points, file_type, target_mask_label, display_table_mask_label, random_downsample_N, voxel_size, filter_degree, min_z, max_z):
+    Log.info(f"[frame({frame_id})]Processing {scene} frame {frame_id}")
+    path = DataLoadUtil.get_path(root, scene, frame_id)
+    cam_info = DataLoadUtil.load_cam_info(path, binocular=True)
+    depth_L, depth_R = DataLoadUtil.load_depth(
+            path, cam_info["near_plane"], 
+            cam_info["far_plane"], 
+            binocular=True
+        )
+    mask_L, mask_R = DataLoadUtil.load_seg(path, binocular=True)
+
+    target_mask_img_L = (mask_L == target_mask_label).all(axis=-1)
+    target_mask_img_R = (mask_R == target_mask_label).all(axis=-1)
+
+    sampled_target_points_L = get_world_points(depth_L, target_mask_img_L, cam_info["cam_intrinsic"], cam_info["cam_to_world"], random_downsample_N)
+    sampled_target_points_R = get_world_points(depth_R, target_mask_img_R, cam_info["cam_intrinsic"], cam_info["cam_to_world_R"], random_downsample_N)
+
+    has_points = sampled_target_points_L.shape[0] > 0 and sampled_target_points_R.shape[0] > 0
+    target_points = np.zeros((0, 3))
+
+    if has_points:
+        target_points = PtsUtil.get_overlapping_points(sampled_target_points_L, sampled_target_points_R, voxel_size)
+
+    if has_points and target_points.shape[0] > 0:
+        points_normals = DataLoadUtil.load_points_normals(root, scene, display_table_as_world_space_origin=True)
+        target_points = PtsUtil.filter_points(
+            target_points, points_normals, cam_info["cam_to_world"], voxel_size=0.002, theta=filter_degree, z_range=(min_z, max_z)
+        )
+
+    scan_points_indices_L = get_scan_points_indices(scan_points, mask_L, display_table_mask_label, cam_info["cam_intrinsic"], cam_info["cam_to_world"]) 
+    scan_points_indices_R = get_scan_points_indices(scan_points, mask_R, display_table_mask_label, cam_info["cam_intrinsic"], cam_info["cam_to_world_R"])
+    scan_points_indices = np.intersect1d(scan_points_indices_L, scan_points_indices_R)
+
+    save_target_points(root, scene, frame_id, target_points, file_type=file_type)
+    save_scan_points_indices(root, scene, frame_id, scan_points_indices, file_type=file_type)
+
+def save_scene_data_multithread(root, scene, file_type="txt"):
+    target_mask_label = (0, 255, 0, 255)
+    display_table_mask_label = (0, 0, 255, 255)
+    random_downsample_N = 32768
+    voxel_size = 0.002
+    filter_degree = 75
+    min_z = 0.2
+    max_z = 0.5
+
+    display_table_info = DataLoadUtil.get_display_table_info(root, scene)
+    radius = display_table_info["radius"]
+    scan_points = np.asarray(ReconstructionUtil.generate_scan_points(display_table_top=0, display_table_radius=radius))
+    frame_num = DataLoadUtil.get_scene_seq_length(root, scene)
+
+    with ThreadPoolExecutor() as executor:
+        futures = {executor.submit(process_frame, frame_id, root, scene, scan_points, file_type, target_mask_label, display_table_mask_label, random_downsample_N, voxel_size, filter_degree, min_z, max_z): frame_id for frame_id in range(frame_num)}
+        
+        for future in as_completed(futures):
+            frame_id = futures[future]
+            try:
+                future.result()
+            except Exception as e:
+                Log.error(f"Error processing frame {frame_id}: {e}")
+
+    save_scan_points(root, scene, scan_points)  # The "done" flag of scene preprocess
+
+
+
+if __name__ == "__main__":
+    #root = "/media/hofee/repository/new_data_with_normal"
+    root = r"/media/hofee/data/tempdir/test_real_output"
+    # list_path = r"/media/hofee/repository/full_list.txt"
+    # scene_list = []
+    
+    # with open(list_path, "r") as f:
+    #     for line in f:
+    #         scene_list.append(line.strip())
+    scene_list = os.listdir(root)
+    from_idx = 0 # 1000
+    to_idx = 1 # 1500
+
+
+    cnt = 0
+    import time
+    total = to_idx - from_idx
+    for scene in scene_list[from_idx:to_idx]:
+        start = time.time()
+        save_scene_data(root, scene, cnt, total, file_type="npy")
+        cnt+=1
+        end = time.time()
+        print(f"Time cost: {end-start}")
--- a/utils/pts_util.py
+++ b/utils/pts_util.py
@@ -3,6 +3,7 @@ import open3d as o3d
 import torch
 import trimesh
 from scipy.spatial import cKDTree
+from utils.pose_util import PoseUtil


 class PtsUtil:
@@ -92,7 +93,7 @@ class PtsUtil:
        cam_pose,
        voxel_size=0.002,
        theta=45,
-        z_range=(0.2, 0.45),
+        z_range=(0.25, 0.5),
    ):
        """filter with z range"""
        points_cam = PtsUtil.transform_point_cloud(points, np.linalg.inv(cam_pose))
@@ -116,6 +117,98 @@ class PtsUtil:
        filtered_sampled_points = sampled_points[idx]
        return filtered_sampled_points[:, :3]

+    @staticmethod
+    def multi_scale_icp(
+        source, target, voxel_size_range, init_transformation=None, steps=20
+    ):
+        pipreg = o3d.pipelines.registration
+
+        if init_transformation is not None:
+            current_transformation = init_transformation
+        else:
+            current_transformation = np.identity(4)
+        cnt = 0
+        best_score = 1e10
+        best_reg = None
+        voxel_sizes = []
+        for i in range(steps):
+            voxel_sizes.append(
+                voxel_size_range[0]
+                + i * (voxel_size_range[1] - voxel_size_range[0]) / steps
+            )
+
+        for voxel_size in voxel_sizes:
+            radius_normal = voxel_size * 2
+            source_downsampled = source.voxel_down_sample(voxel_size)
+            source_downsampled.estimate_normals(
+                search_param=o3d.geometry.KDTreeSearchParamHybrid(
+                    radius=radius_normal, max_nn=30
+                )
+            )
+            target_downsampled = target.voxel_down_sample(voxel_size)
+            target_downsampled.estimate_normals(
+                search_param=o3d.geometry.KDTreeSearchParamHybrid(
+                    radius=radius_normal, max_nn=30
+                )
+            )
+
+            reg_icp = pipreg.registration_icp(
+                source_downsampled,
+                target_downsampled,
+                voxel_size * 2,
+                current_transformation,
+                pipreg.TransformationEstimationPointToPlane(),
+                pipreg.ICPConvergenceCriteria(max_iteration=500),
+            )
+            cnt += 1
+            if reg_icp.fitness == 0:
+                score = 1e10
+            else:
+                score = reg_icp.inlier_rmse / reg_icp.fitness
+            
+            if score < best_score:
+                best_score = score
+                best_reg = reg_icp
+
+        return best_reg, best_score
+
+    @staticmethod
+    def multi_scale_ransac(source_downsampled, target_downsampled, source_fpfh, model_fpfh, voxel_size_range, steps=20):
+        pipreg = o3d.pipelines.registration
+        cnt = 0
+        best_score = 1e10
+        best_reg = None
+        voxel_sizes = []
+        for i in range(steps):
+            voxel_sizes.append(
+                voxel_size_range[0]
+                + i * (voxel_size_range[1] - voxel_size_range[0]) / steps
+            )
+
+        for voxel_size in voxel_sizes:
+            reg_ransac = pipreg.registration_ransac_based_on_feature_matching(
+                source_downsampled,
+                target_downsampled,
+                source_fpfh,
+                model_fpfh,
+                mutual_filter=True,
+                max_correspondence_distance=voxel_size*2,
+                estimation_method=pipreg.TransformationEstimationPointToPoint(False),
+                ransac_n=4,
+                checkers=[pipreg.CorrespondenceCheckerBasedOnEdgeLength(0.9)],
+                criteria=pipreg.RANSACConvergenceCriteria(8000000, 500),
+            )
+            cnt += 1
+            if reg_ransac.fitness == 0:
+                score = 1e10
+            else:
+                score = reg_ransac.inlier_rmse / reg_ransac.fitness
+            if score < best_score:
+                best_score = score
+                best_reg = reg_ransac
+
+        return best_reg, best_score
+
    @staticmethod
    def register(pcl: np.ndarray, model: trimesh.Trimesh, voxel_size=0.01):
        radius_normal = voxel_size * 2
@@ -146,26 +239,41 @@ class PtsUtil:
            o3d.geometry.KDTreeSearchParamHybrid(radius=radius_normal, max_nn=100),
        )

-        reg_ransac = pipreg.registration_ransac_based_on_feature_matching(
+        reg_ransac, ransac_best_score = PtsUtil.multi_scale_ransac(
            source_downsampled,
            model_downsampled,
            source_fpfh,
            model_fpfh,
-            mutual_filter=True,
-            max_correspondence_distance=voxel_size * 1.5,
-            estimation_method=pipreg.TransformationEstimationPointToPoint(False),
-            ransac_n=4,
-            checkers=[pipreg.CorrespondenceCheckerBasedOnEdgeLength(0.9)],
-            criteria=pipreg.RANSACConvergenceCriteria(4000000, 500),
+            voxel_size_range=(0.03, 0.005),
+            steps=3,
        )
-        
-        reg_icp = pipreg.registration_icp(
+        reg_icp, icp_best_score = PtsUtil.multi_scale_icp(
            source_downsampled,
            model_downsampled,
-            voxel_size * 2,
-            reg_ransac.transformation,
-            pipreg.TransformationEstimationPointToPlane(),
-            pipreg.ICPConvergenceCriteria(max_iteration=200),
+            voxel_size_range=(0.02, 0.001),
+            init_transformation=reg_ransac.transformation,
+            steps=50,
        )
-        
        return reg_icp.transformation
+    
+    @staticmethod
+    def get_pts_from_depth(depth, cam_intrinsic, cam_extrinsic):
+        h, w = depth.shape
+        i, j = np.meshgrid(np.arange(w), np.arange(h), indexing="xy")
+
+        z = depth
+        x = (i - cam_intrinsic[0, 2]) * z / cam_intrinsic[0, 0]
+        y = (j - cam_intrinsic[1, 2]) * z / cam_intrinsic[1, 1]
+
+        points_camera = np.stack((x, y, z), axis=-1).reshape(-1, 3)
+        mask = mask.reshape(-1, 4)
+        points_camera = np.concatenate(
+            [points_camera, np.ones((points_camera.shape[0], 1))], axis=-1
+        )
+
+        points_world = np.dot(cam_extrinsic, points_camera.T).T[:, :3]
+        data = {
+            "points_world": points_world,
+            "points_camera": points_camera,
+        }
+        return data
--- a/utils/reconstruction_util.py
+++ b/utils/reconstruction_util.py
@@ -8,20 +8,19 @@ class ReconstructionUtil:
    def compute_coverage_rate(target_point_cloud, combined_point_cloud, threshold=0.01):
        kdtree = cKDTree(combined_point_cloud)
        distances, _ = kdtree.query(target_point_cloud)
-        covered_points_num = np.sum(distances < threshold)
+        covered_points_num = np.sum(distances < threshold*2)
        coverage_rate = covered_points_num / target_point_cloud.shape[0]
        return coverage_rate, covered_points_num
    
    @staticmethod
-    def compute_overlap_rate(new_point_cloud, combined_point_cloud, threshold=0.01):
+    def check_overlap(new_point_cloud, combined_point_cloud, overlap_area_threshold=25, voxel_size=0.01):
        kdtree = cKDTree(combined_point_cloud)
        distances, _ = kdtree.query(new_point_cloud)
-        overlapping_points = np.sum(distances < threshold)
-        if new_point_cloud.shape[0] == 0:
-            overlap_rate = 0
-        else:
-            overlap_rate = overlapping_points / new_point_cloud.shape[0]
-        return overlap_rate
+        overlapping_points = np.sum(distances < voxel_size*2)
+        cm = 0.01
+        voxel_size_cm = voxel_size / cm
+        overlap_area = overlapping_points * voxel_size_cm * voxel_size_cm
+        return overlap_area > overlap_area_threshold


    @staticmethod
@@ -121,7 +120,37 @@ class ReconstructionUtil:
            sm.set_progress(app_name, runner_name, "processed view", len(point_cloud_list), len(point_cloud_list))
        return view_sequence, remaining_views, combined_point_cloud

-    
+    @staticmethod
+    def compute_next_best_view_with_overlap(scanned_pts, point_cloud_list, history_indices, scan_points_indices_list, threshold=0.01, overlap_area_threshold=25, scan_points_threshold=5):
+        max_rec_pts = np.vstack(point_cloud_list)
+        downsampled_max_rec_pts = PtsUtil.voxel_downsample_point_cloud(max_rec_pts, threshold)
+        best_view = None
+        best_coverage = -1
+        best_covered_num = 0
+        for view in range(len(point_cloud_list)):
+            if point_cloud_list[view].shape[0] == 0:
+                continue
+            new_scan_points_indices = scan_points_indices_list[view]
+            
+            if not ReconstructionUtil.check_scan_points_overlap(history_indices, new_scan_points_indices, scan_points_threshold):
+                curr_overlap_area_threshold = overlap_area_threshold
+            else:
+                curr_overlap_area_threshold = overlap_area_threshold * 0.5
+                
+            if not ReconstructionUtil.check_overlap(point_cloud_list[view], scanned_pts, overlap_area_threshold = curr_overlap_area_threshold, voxel_size=threshold):
+                continue
+            
+            
+            new_combined_point_cloud = np.vstack([scanned_pts ,point_cloud_list[view]])
+            new_downsampled_combined_point_cloud = PtsUtil.voxel_downsample_point_cloud(new_combined_point_cloud,threshold)
+            new_coverage, new_covered_num = ReconstructionUtil.compute_coverage_rate(downsampled_max_rec_pts, new_downsampled_combined_point_cloud, threshold)
+            if new_coverage > best_coverage:
+                best_coverage = new_coverage
+                best_covered_num = new_covered_num
+                best_view = view
+                
+        return best_view, best_coverage, best_covered_num
+        
    @staticmethod
    def generate_scan_points(display_table_top, display_table_radius, min_distance=0.03, max_points_num = 500, max_attempts = 1000):
        points = []
@@ -152,9 +181,15 @@ class ReconstructionUtil:
    
    @staticmethod
    def check_scan_points_overlap(history_indices, indices2, threshold=5):
-        for indices1 in history_indices:
-            if len(set(indices1).intersection(set(indices2))) >= threshold:
-                return True
+        try:
+            if len(indices2) == 0:
+                return False
+            for indices1 in history_indices:
+                if len(set(indices1).intersection(set(indices2))) >= threshold:
+                    return True
+        except Exception as e:
+            print(e)
+            import ipdb; ipdb.set_trace()
        return False

        
--- a/utils/render_util.py
+++ b/utils/render_util.py
@@ -0,0 +1,45 @@
+
+import os
+import json
+import subprocess
+import tempfile
+import shutil
+from utils.data_load import DataLoadUtil
+from utils.pts_util import PtsUtil
+class RenderUtil:
+
+    @staticmethod
+    def render_pts(cam_pose, object_name, script_path, model_points_normals, voxel_threshold=0.005, filter_degree=75, nO_to_nL_pose=None, require_full_scene=False):
+        nO_to_world_pose = DataLoadUtil.get_real_cam_O_from_cam_L(cam_pose, nO_to_nL_pose, scene_path=scene_path)
+        with tempfile.TemporaryDirectory() as temp_dir:
+            params = {
+                "cam_pose": nO_to_world_pose.tolist(),
+                "object_name": scene_path
+            }
+            params_data_path = os.path.join(temp_dir, "params.json")
+            with open(params_data_path, 'w') as f:
+                json.dump(params, f)
+            result = subprocess.run([
+                'blender', '-b', '-P', script_path, '--', temp_dir
+            ], capture_output=True, text=True)
+            if result.returncode != 0:
+                print("Blender script failed:")
+                print(result.stderr)
+                return None
+            path = os.path.join(temp_dir, "tmp")
+            point_cloud = DataLoadUtil.get_target_point_cloud_world_from_path(path, binocular=True)
+            cam_params = DataLoadUtil.load_cam_info(path, binocular=True)
+            
+            filtered_point_cloud = PtsUtil.filter_points(point_cloud, model_points_normals, cam_pose=cam_params["cam_to_world"], voxel_size=voxel_threshold, theta=filter_degree)
+            full_scene_point_cloud = None
+            if require_full_scene:
+                depth_L, depth_R = DataLoadUtil.load_depth(path, cam_params['near_plane'], cam_params['far_plane'], binocular=True)
+                point_cloud_L = DataLoadUtil.get_point_cloud(depth_L, cam_params['cam_intrinsic'], cam_params['cam_to_world'])['points_world']
+                point_cloud_R = DataLoadUtil.get_point_cloud(depth_R, cam_params['cam_intrinsic'], cam_params['cam_to_world_R'])['points_world']
+            
+                point_cloud_L = PtsUtil.random_downsample_point_cloud(point_cloud_L, 65536)
+                point_cloud_R = PtsUtil.random_downsample_point_cloud(point_cloud_R, 65536)
+                full_scene_point_cloud = PtsUtil.get_overlapping_points(point_cloud_L, point_cloud_R)
+
+            
+            return filtered_point_cloud, full_scene_point_cloud
--- a/utils/view_sample_util.py
+++ b/utils/view_sample_util.py
@@ -1,162 +0,0 @@
-
-import numpy as np
-from utils.pose_util import PoseUtil
-import trimesh
-from collections import defaultdict
-from scipy.spatial.transform import Rotation as R
-import random
-
-class ViewSampleUtil:
-    @staticmethod
-    def farthest_point_sampling(points, num_samples):
-        num_points = points.shape[0]
-        if num_samples >= num_points:
-            return points, np.arange(num_points)
-        sampled_indices = np.zeros(num_samples, dtype=int)
-        sampled_indices[0] = np.random.randint(num_points)
-        min_distances = np.full(num_points, np.inf)
-        for i in range(1, num_samples):
-            current_point = points[sampled_indices[i - 1]]
-            dist_to_current_point = np.linalg.norm(points - current_point, axis=1)
-            min_distances = np.minimum(min_distances, dist_to_current_point)
-            sampled_indices[i] = np.argmax(min_distances)
-        downsampled_points = points[sampled_indices]
-        return downsampled_points, sampled_indices
-    
-    @staticmethod
-    def voxel_downsample(points, voxel_size):
-        voxel_grid = defaultdict(list)
-        for i, point in enumerate(points):
-            voxel_index = tuple((point // voxel_size).astype(int))
-            voxel_grid[voxel_index].append(i)
-
-        downsampled_points = []
-        downsampled_indices = []
-        for indices in voxel_grid.values():
-            selected_index = indices[0]
-            downsampled_points.append(points[selected_index])
-            downsampled_indices.append(selected_index)
-
-        return np.array(downsampled_points), downsampled_indices
-
-    @staticmethod
-    def sample_view_data(mesh: trimesh.Trimesh, distance_range: tuple = (0.25, 0.5), voxel_size: float = 0.005, max_views: int = 1, pertube_repeat: int = 1) -> dict:
-        view_data = {
-            "look_at_points": [],
-            "cam_positions": [],
-        }
-
-        vertices = mesh.vertices
-        look_at_points = []
-        cam_positions = []
-        normals = []
-        vertex_normals = mesh.vertex_normals
-
-        for i, vertex in enumerate(vertices):
-            look_at_point = vertex
-            
-            view_data["look_at_points"].append(look_at_point)
-
-            normal = vertex_normals[i]
-            if np.isnan(normal).any():
-                continue
-            if np.dot(normal, look_at_point) < 0:
-                normal = -normal
-            
-            normals.append(normal)
-
-            for _ in range(pertube_repeat):
-                perturb_angle = np.radians(np.random.uniform(0, 30))
-                perturb_axis = np.random.normal(size=3)
-                perturb_axis /= np.linalg.norm(perturb_axis)
-                rotation_matrix = R.from_rotvec(perturb_angle * perturb_axis).as_matrix()
-                perturbed_normal = np.dot(rotation_matrix, normal)
-
-                distance = np.random.uniform(*distance_range)
-                cam_position = look_at_point + distance * perturbed_normal
-                look_at_points.append(look_at_point)
-                cam_positions.append(cam_position)
-
-        look_at_points = np.array(look_at_points)
-        cam_positions = np.array(cam_positions)
-
-        voxel_downsampled_look_at_points, selected_indices = ViewSampleUtil.voxel_downsample(look_at_points, voxel_size)
-        voxel_downsampled_cam_positions = cam_positions[selected_indices]
-        voxel_downsampled_normals = np.array(normals)[selected_indices]
-
-        fps_downsampled_look_at_points, selected_indices = ViewSampleUtil.farthest_point_sampling(voxel_downsampled_look_at_points, max_views * 2)
-        fps_downsampled_cam_positions = voxel_downsampled_cam_positions[selected_indices]
-
-        view_data["look_at_points"] = fps_downsampled_look_at_points.tolist()
-        view_data["cam_positions"] = fps_downsampled_cam_positions.tolist()
-        view_data["normals"] = voxel_downsampled_normals.tolist()
-        view_data["voxel_down_sampled_points"] = voxel_downsampled_look_at_points 
-
-        return view_data
-    
-    @staticmethod
-    def get_world_points_and_normals(view_data: dict, obj_world_pose: np.ndarray) -> tuple:
-        world_points = []
-        world_normals = []
-        for voxel_down_sampled_points, normal in zip(view_data["voxel_down_sampled_points"], view_data["normals"]):
-            voxel_down_sampled_points_world = obj_world_pose @ np.append(voxel_down_sampled_points, 1.0)
-            normal_world = obj_world_pose[:3, :3] @ normal
-            world_points.append(voxel_down_sampled_points_world[:3])
-            world_normals.append(normal_world)
-        return np.array(world_points), np.array(world_normals)
-    
-    @staticmethod
-    def get_cam_pose(view_data: dict, obj_world_pose: np.ndarray, max_views: int, min_cam_table_included_degree: int, random_view_ratio: float) -> np.ndarray:
-        cam_poses = []
-        min_height_z = 1000
-        for look_at_point, cam_position in zip(view_data["look_at_points"], view_data["cam_positions"]):
-            look_at_point_world = obj_world_pose @ np.append(look_at_point, 1.0)
-            cam_position_world = obj_world_pose @ np.append(cam_position, 1.0)
-            if look_at_point_world[2] < min_height_z:
-                min_height_z = look_at_point_world[2]
-            look_at_point_world = look_at_point_world[:3]  
-            cam_position_world = cam_position_world[:3]    
-            
-            forward_vector = cam_position_world - look_at_point_world
-            forward_vector /= np.linalg.norm(forward_vector)
-            
-            up_vector = np.array([0, 0, 1])
-
-            right_vector = np.cross(up_vector, forward_vector)
-            right_vector /= np.linalg.norm(right_vector)
-
-            corrected_up_vector = np.cross(forward_vector, right_vector)
-            rotation_matrix = np.array([right_vector, corrected_up_vector, forward_vector]).T
-
-            cam_pose = np.eye(4)
-            cam_pose[:3, :3] = rotation_matrix
-            cam_pose[:3, 3] = cam_position_world
-            cam_poses.append(cam_pose)
-
-        filtered_cam_poses = []
-        for cam_pose in cam_poses:
-            if cam_pose[2, 3] > min_height_z:
-                direction_vector = cam_pose[:3, 2]
-                horizontal_normal = np.array([0, 0, 1])  
-                cos_angle = np.dot(direction_vector, horizontal_normal) / (np.linalg.norm(direction_vector) * np.linalg.norm(horizontal_normal))
-                angle = np.arccos(np.clip(cos_angle, -1.0, 1.0))  
-                angle_degree = np.degrees(angle)
-                if angle_degree < 90 - min_cam_table_included_degree:
-                    filtered_cam_poses.append(cam_pose)
-                if random.random() < random_view_ratio:
-                    pertube_pose = PoseUtil.get_uniform_pose([0.1, 0.1, 0.1], [3, 3, 3], 0, 180, "cm")
-                    filtered_cam_poses.append(pertube_pose @ cam_pose)
-                    
-        if len(filtered_cam_poses) > max_views:
-            indices = np.random.choice(len(filtered_cam_poses), max_views, replace=False)
-            filtered_cam_poses = [filtered_cam_poses[i] for i in indices]
-            
-        return np.array(filtered_cam_poses)
-        
-    @staticmethod
-    def sample_view_data_world_space(mesh: trimesh.Trimesh, cad_to_world: np.ndarray, distance_range:tuple = (0.25,0.5), voxel_size:float = 0.005, max_views: int=1, min_cam_table_included_degree:int=20, random_view_ratio:float = 0.2) -> dict:
-        view_data = ViewSampleUtil.sample_view_data(mesh, distance_range, voxel_size, max_views)
-        view_data["cam_to_world_poses"] = ViewSampleUtil.get_cam_pose(view_data, cad_to_world, max_views, min_cam_table_included_degree, random_view_ratio)
-        view_data["voxel_down_sampled_points"], view_data["normals"] =  ViewSampleUtil.get_world_points_and_normals(view_data, cad_to_world)
-        return view_data
-    
--- a/utils/view_util.py
+++ b/utils/view_util.py
@@ -0,0 +1,127 @@
+import numpy as np
+from scipy.spatial.transform import Rotation as R
+from dataclasses import dataclass
+
+
+@dataclass
+class CameraIntrinsics:
+    width: int
+    height: int
+    fx: float
+    fy: float
+    cx: float
+    cy: float
+
+    @property
+    def intrinsic_matrix(self):
+        return np.array([[self.fx, 0, self.cx], [0, self.fy, self.cy], [0, 0, 1]])
+
+
+@dataclass
+class CameraExtrinsics:
+    def __init__(self, rotation: np.ndarray, translation: np.ndarray, rot_type: str):
+        """
+        rotation: 3x3 rotation matrix or 1x3 euler angles or 1x4 quaternion
+        translation: 1x3 or 3x1 translation vector
+        rot_type: "mat", "euler_xyz", "quat_xyzw"
+        """
+        assert rot_type in ["mat", "euler_xyz", "quat_xyzw"]
+        if rot_type == "mat":
+            self._rot = R.from_matrix(rotation)
+        elif rot_type == "euler_xyz":
+            self._rot = R.from_euler('xyz', rotation, degrees=True)
+        elif rot_type == "quat_xyzw":
+            self._rot = R.from_quat(rotation)
+        self._translation = translation
+
+    @property
+    def extrinsic_matrix(self):
+        return np.vstack([np.hstack([self._rot.as_matrix(), self._translation.reshape(3, 1)]), [0, 0, 0, 1]])
+    
+    @property
+    def rotation_euler_xyz(self):
+        return self._rot.as_euler('xyz', degrees=True)
+    
+    @property
+    def rotation_quat_xyzw(self):
+        return self._rot.as_quat()
+    
+    @property
+    def rotation_matrix(self):
+        return self._rot.as_matrix()
+    
+    @property
+    def translation(self):
+        return self._translation
+    
+
+@dataclass
+class CameraData:
+    def __init__(self, depth_image: np.ndarray, image_id: int, intrinsics: CameraIntrinsics, extrinsics: CameraExtrinsics):
+        self._depth_image = depth_image
+        self._image_id = image_id
+        self._intrinsics = intrinsics
+        self._extrinsics = extrinsics
+
+    @property
+    def depth_image(self):
+        return self._depth_image
+    
+    @property
+    def image_id(self):
+        return self._image_id
+    
+    @property
+    def intrinsics(self):
+        return self._intrinsics.intrinsic_matrix
+    
+    @property
+    def extrinsics(self):
+        return self._extrinsics.extrinsic_matrix
+    
+    @property
+    def projection_matrix(self):
+        return self.intrinsics @ self.extrinsics[:3, :4]
+    
+    @property
+    def pts_camera(self):
+        height, width = self.depth_image.shape
+        v, u = np.indices((height, width))
+        points = np.vstack([u.flatten(), v.flatten(), np.ones_like(u.flatten())]) # 3xN
+        points = np.linalg.inv(self.intrinsics) @ points                          # 3xN
+        points = points.T                                                         # Nx3
+        points = points * self.depth_image.flatten()[:, np.newaxis]               # Nx3
+        points = points[points[:, 2] > 0]                                         # Nx3
+        return points
+    
+    @property
+    def pts_world(self):
+        homogeneous_pts = np.hstack([self.pts_camera, np.ones((self.pts_camera.shape[0], 1))]) # Nx4
+        pts_world = self.extrinsics @ homogeneous_pts.T # 4xN
+        return pts_world[:3, :].T
+    
+class ViewUtil:
+    def get_pts(view_data):
+        image_id = view_data["image_id"]
+        depth_intrinsics = view_data["depth_intrinsics"]
+        depth_extrinsics = view_data["depth_extrinsics"]
+        depth_image = np.array(view_data["depth_image"], dtype=np.uint16)
+        if image_id is None:
+            return None
+        else:
+            camera_intrinsics = CameraIntrinsics(
+                depth_intrinsics['width'],
+                depth_intrinsics['height'],
+                depth_intrinsics['fx'], 
+                depth_intrinsics['fy'], 
+                depth_intrinsics['cx'], 
+                depth_intrinsics['cy']
+            )
+            camera_extrinsics = CameraExtrinsics(
+                depth_extrinsics[:3, :3], 
+                depth_extrinsics[:3, 3],
+                rot_type="mat"
+            )
+            camera_data = CameraData(depth_image, image_id, camera_intrinsics, camera_extrinsics)
+            pts = camera_data.pts_world
+        return pts/1000
--- a/vis_pts_and_nrm.py
+++ b/vis_pts_and_nrm.py
@@ -0,0 +1,54 @@
+# import numpy as np
+# import matplotlib.pyplot as plt
+# from mpl_toolkits.mplot3d import Axes3D
+
+# # 假设 points_and_normals 是你的 Nx6 矩阵
+# # 前三列是点坐标，后三列是法线
+# points_and_normals = np.loadtxt("/Users/hofee/Downloads/temp_output/cad_model_world/points_and_normals.txt")  # 这里用随机点代替你的数据
+# points = points_and_normals[:100, :3]
+# normals = points_and_normals[:100, 3:]
+
+# # 创建3D图形
+# fig = plt.figure()
+# ax = fig.add_subplot(111, projection='3d')
+
+# # 绘制点云
+# ax.scatter(points[:, 0], points[:, 1], points[:, 2], color='b', marker='o')
+
+# # 绘制法线 (从每个点出发的一小段箭头)
+# ax.quiver(points[:, 0], points[:, 1], points[:, 2],
+#           normals[:, 0], normals[:, 1], normals[:, 2], length=0.1, color='r')
+
+# plt.show()
+
+import numpy as np
+
+# 假设 points_and_normals 是你的 Nx6 矩阵
+# points_and_normals[:,:3] 是点的坐标
+# points_and_normals[:,3:] 是法线
+points_and_normals = np.loadtxt("/Users/hofee/Downloads/temp_output/cad_model_world/points_and_normals.txt")  # 这里用随机点代替你的数据
+print(points_and_normals.shape)
+points = points_and_normals[300:400, :3]
+normals = points_and_normals[300:400, 3:]
+
+# 设置你想在法线方向上采样的距离范围和点数
+num_samples_per_point = 20  # 每个法线方向采样的点数
+sampling_distances = np.linspace(0, 0.5, num_samples_per_point)  # 采样距离范围
+
+# 创建一个空列表来保存采样点
+sampled_points = []
+
+# 对每个点进行法线方向的采样
+for point, normal in zip(points, normals):
+    for dist in sampling_distances:
+        # 在法线方向上偏移点
+        sampled_point = point + dist * normal
+        sampled_points.append(sampled_point)
+
+# 转换为 numpy 数组
+sampled_points = np.array(sampled_points)
+
+# 保存为点云文件 (例如 .txt 或 .xyz 格式)
+np.savetxt('sampled_points.txt', sampled_points)
+
+print("采样点云已保存为 'sampled_points.xyz'")
Author	SHA1	Message	Date
hofee	307994c20d	update	2024-10-18 17:13:45 +08:00
hofee	20514be419	update displaytable rotation	2024-10-14 19:37:34 +08:00
hofee	2f87a2626c	update	2024-10-13 19:47:05 +08:00
hofee	41ee79db0c	update config	2024-10-13 15:24:41 +08:00
hofee	07dcdb3452	add close loop control	2024-10-12 23:11:25 +08:00
hofee	8d43d4de60	update	2024-10-12 20:25:55 +08:00
hofee	3fe74eb6eb	update	2024-10-12 16:39:00 +08:00
hofee	cd85fed3a0	update	2024-10-10 21:48:55 +08:00
hofee	8fd2d6b1e1	optimize	2024-10-10 15:13:40 +08:00
hofee	f6c4db859e	add multiprocess	2024-10-10 14:42:57 +08:00
hofee	ba36803fba	finish pipeline	2024-10-09 21:46:13 +08:00
hofee	f8514564c1	solve merge	2024-10-08 21:33:17 +08:00
hofee	3ab046b134	update	2024-10-08 21:28:30 +08:00