Skip to content

Commit 1e2b25b

Browse files
authored
Release new model, fix bugs and warnings (#52)
* Release temporal Maskgit of LiDAR generation * Fix video streaming generation due to the code change of temporal VAE * Fix security warning of transformers
1 parent 6eb4914 commit 1e2b25b

12 files changed

Lines changed: 412 additions & 48 deletions

.gitattributes

Lines changed: 0 additions & 1 deletion
This file was deleted.

README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -91,8 +91,8 @@ You can download our pre-trained tokenizer and generation model in the following
9191
| | nuscene, waymo, argoverse, kitti360 | [Config](configs/lidar/lidar_vqvae_nwak.json) | [checkpoint](http://103.237.29.236:10030/lidar_vqvae_nwak_80k.pth), [blank code](http://103.237.29.236:10030/lidar_vqvae_nwak_80k_blank_code.pkl) |
9292
| MaskGIT | nuscene | [Config](configs/lidar/lidar_maskgit_layout_ns.json) | [ckpt_with_vqvae_nwa](http://103.237.29.236:10030/lidar_maskgit_nusc_150k.pth) <br> [ckpt_with_vqvae_nwak](http://103.237.29.236:10030/lidar_maskgit_vq80k_layout_ns_120k.pth) |
9393
| | kitti360 | [Config](configs/lidar/lidar_maskgit_vq80k_layout_kt.json) | [checkpoint](http://103.237.29.236:10030/lidar_maskgit_vq80k_layout_kt_120k.pth)|
94-
| Temporal MaskGIT | nuscene | [Config](configs/lidar/lidar_maskgit_temporal_vq80k_layout_ns.json) | checkpoint(TODO) |
95-
| | kitti360 | [Config](configs/lidar/lidar_maskgit_temporal_vq80k_layout_kt.json) | checkpoint(TODO)|
94+
| Temporal MaskGIT | nuscene | [Config](configs/lidar/lidar_maskgit_temporal_vq80k_layout_ns.json) | [checkpoint](http://103.237.29.236:10030/lidar_maskgit_temporal_vq80k_layout_ns_150k.pth) |
95+
| | kitti360 | [Config](configs/lidar/lidar_maskgit_temporal_vq80k_layout_kt.json) | [checkpoint](http://103.237.29.236:10030/lidar_maskgit_temporal_vq80k_layout_kt_150k.pth)|
9696
## Examples
9797

9898
### T2I, T2V generation with CTSD pipeline

configs/lidar/lidar_maskgit_temporal_vq80k_layout_kt.json

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -622,6 +622,13 @@
622622
"persistent_workers": true
623623
},
624624
"informations": {
625-
"todo": "todo"
625+
"voxel_iou": 0.11702190,
626+
"chamfer_distance": 3.34721875,
627+
"chamfer_distance_30": 1.88547862,
628+
"chamfer_distance_40": 2.57636571,
629+
"mmd": 0.00411365,
630+
"jsd": 0.31335828,
631+
"total_batch_sizes": 24,
632+
"steps": 150000
626633
}
627634
}

configs/lidar/lidar_maskgit_temporal_vq80k_layout_ns.json

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -786,6 +786,11 @@
786786
"persistent_workers": true
787787
},
788788
"informations": {
789-
"todo": "todo"
789+
"voxel_iou": 0.12602140,
790+
"chamfer_distance": 3.48719001,
791+
"chamfer_distance_30": 1.59294820,
792+
"chamfer_distance_40": 2.51212931,
793+
"total_batch_sizes": 24,
794+
"steps": 150000
790795
}
791796
}

examples/lidar_maskgit_preview.json

Lines changed: 22 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -77,28 +77,28 @@
7777
"bias_init": -5.0
7878
},
7979
"bi_directional_Transformer": {
80-
"_class_name": "dwm.models.maskgit_model.BidirectionalTransformerWithAdapter",
81-
"use_extra_embedding": true,
82-
"n_e": 2048,
83-
"e_dim": 1024,
84-
"hidden_dim": 1280,
85-
"img_size": [
86-
80,
87-
80
88-
],
89-
"num_heads": 40,
90-
"use_checkpoint": true,
91-
"depth": 24,
92-
"condition_adapter": {
93-
"_class_name": "dwm.models.adapters.ImageAdapter",
94-
"in_channels": 6,
95-
"channels": [1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280],
96-
"downscale_factor": 8,
97-
"is_downblocks": [false, false, false, false, false, false, false, false],
98-
"use_zero_convs": true,
99-
"gradient_checkpointing": true
100-
}
101-
},
80+
"_class_name": "dwm.models.maskgit_model.BidirectionalTransformerWithAdapter",
81+
"use_extra_embedding": true,
82+
"n_e": 2048,
83+
"e_dim": 1024,
84+
"hidden_dim": 1280,
85+
"img_size": [
86+
80,
87+
80
88+
],
89+
"num_heads": 40,
90+
"use_checkpoint": true,
91+
"depth": 24,
92+
"condition_adapter": {
93+
"_class_name": "dwm.models.adapters.ImageAdapter",
94+
"in_channels": 6,
95+
"channels": [1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280],
96+
"downscale_factor": 8,
97+
"is_downblocks": [false, false, false, false, false, false, false, false],
98+
"use_zero_convs": true,
99+
"gradient_checkpointing": true
100+
}
101+
},
102102
"vq_point_cloud_ckpt_path": "/cache/aoss-v2.st-sh-01.sensecoreapi-oss.cn/users/wuzehuan/workspaces/worldmodels/models/lidar_vqvae_nwa_60k.pth",
103103
"vq_blank_code_path": "/cache/aoss-v2.st-sh-01.sensecoreapi-oss.cn/users/wuzehuan/workspaces/worldmodels/models/lidar_vqvae_nwa_60k_blank_code.pkl",
104104
"model_ckpt_path": "/mnt/storage/user/liuyichen/tasks/lidar_maskgit_nusc_full-align-line/checkpoints/150k.pth",

0 commit comments

Comments
 (0)