lyttt committed on
Commit
8a70e8e
·
verified ·
1 Parent(s): 5f5f46e

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. CausVid.egg-info/PKG-INFO +5 -0
  2. CausVid.egg-info/SOURCES.txt +7 -0
  3. CausVid.egg-info/dependency_links.txt +1 -0
  4. CausVid.egg-info/top_level.txt +1 -0
  5. configs/sdxl_8node_dmd_config.yaml +42 -0
  6. configs/wan_bidirectional_dmd.yaml +48 -0
  7. configs/wan_bidirectional_dmd_from_scratch.yaml +49 -0
  8. configs/wan_causal_dmd.yaml +53 -0
  9. configs/wan_causal_dmd_warp_4step_cfg2.yaml +54 -0
  10. configs/wan_causal_ode.yaml +31 -0
  11. output/wandb/run-20250908_063808-yfn0incq/files/output.log +26 -0
  12. output/wandb/run-20250908_063808-yfn0incq/files/requirements.txt +145 -0
  13. output/wandb/run-20250908_063808-yfn0incq/files/wandb-metadata.json +93 -0
  14. output/wandb/run-20250908_063808-yfn0incq/logs/debug-core.log +7 -0
  15. output/wandb/run-20250908_063808-yfn0incq/logs/debug-internal.log +6 -0
  16. output/wandb/run-20250908_063808-yfn0incq/logs/debug.log +22 -0
  17. output/wandb/run-20250908_063808-yfn0incq/run-yfn0incq.wandb +0 -0
  18. output/wandb/run-20250908_064634-xd44venm/files/wandb-metadata.json +93 -0
  19. output/wandb/run-20250908_064634-xd44venm/logs/debug-core.log +7 -0
  20. output/wandb/run-20250908_065643-lyib7g2q/files/output.log +25 -0
  21. output/wandb/run-20250908_065643-lyib7g2q/files/requirements.txt +145 -0
  22. output/wandb/run-20250908_065643-lyib7g2q/files/wandb-metadata.json +93 -0
  23. output/wandb/run-20250908_065643-lyib7g2q/logs/debug-core.log +7 -0
  24. output/wandb/run-20250908_065643-lyib7g2q/logs/debug-internal.log +6 -0
  25. output/wandb/run-20250908_065643-lyib7g2q/logs/debug.log +22 -0
  26. output/wandb/run-20250908_081933-xtabuxq1/files/config.yaml +159 -0
  27. output/wandb/run-20250908_081933-xtabuxq1/files/wandb-metadata.json +93 -0
  28. output/wandb/run-20250908_081933-xtabuxq1/logs/debug-core.log +14 -0
  29. output/wandb/run-20250908_081933-xtabuxq1/logs/debug.log +24 -0
  30. output/wandb/run-20250908_084516-b1cckt0e/logs/debug-core.log +7 -0
  31. output/wandb/run-20250908_084949-b9yvqkt5/files/config.yaml +160 -0
  32. output/wandb/run-20250908_084949-b9yvqkt5/files/output.log +94 -0
  33. output/wandb/run-20250908_084949-b9yvqkt5/files/requirements.txt +145 -0
  34. output/wandb/run-20250908_084949-b9yvqkt5/files/wandb-metadata.json +93 -0
  35. output/wandb/run-20250908_084949-b9yvqkt5/files/wandb-summary.json +1 -0
  36. output/wandb/run-20250908_084949-b9yvqkt5/logs/debug-core.log +14 -0
  37. output/wandb/run-20250908_084949-b9yvqkt5/logs/debug-internal.log +11 -0
  38. output/wandb/run-20250908_084949-b9yvqkt5/logs/debug.log +24 -0
  39. output/wandb/run-20250908_084949-b9yvqkt5/run-b9yvqkt5.wandb +0 -0
  40. output/wandb/run-20250908_085656-y8q57cbx/files/output.log +1 -0
  41. output/wandb/run-20250908_085656-y8q57cbx/files/requirements.txt +145 -0
  42. output/wandb/run-20250908_085656-y8q57cbx/files/wandb-metadata.json +93 -0
  43. output/wandb/run-20250908_085656-y8q57cbx/run-y8q57cbx.wandb +0 -0
  44. output/wandb/run-20250908_091534-f394z0xa/files/config.yaml +160 -0
  45. output/wandb/run-20250908_091534-f394z0xa/files/output.log +66 -0
  46. output/wandb/run-20250908_091534-f394z0xa/files/requirements.txt +145 -0
  47. output/wandb/run-20250908_091534-f394z0xa/files/wandb-metadata.json +93 -0
  48. output/wandb/run-20250908_091534-f394z0xa/files/wandb-summary.json +1 -0
  49. output/wandb/run-20250908_091534-f394z0xa/logs/debug-internal.log +11 -0
  50. output/wandb/run-20250908_091534-f394z0xa/logs/debug.log +24 -0
CausVid.egg-info/PKG-INFO ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ Metadata-Version: 2.4
2
+ Name: CausVid
3
+ Version: 0.0.1
4
+ License-File: LICENSE.md
5
+ Dynamic: license-file
CausVid.egg-info/SOURCES.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ LICENSE.md
2
+ README.md
3
+ setup.py
4
+ CausVid.egg-info/PKG-INFO
5
+ CausVid.egg-info/SOURCES.txt
6
+ CausVid.egg-info/dependency_links.txt
7
+ CausVid.egg-info/top_level.txt
CausVid.egg-info/dependency_links.txt ADDED
@@ -0,0 +1 @@
 
 
1
+
CausVid.egg-info/top_level.txt ADDED
@@ -0,0 +1 @@
 
 
1
+
configs/sdxl_8node_dmd_config.yaml ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_name: sdxl
2
+ generator_grad:
3
+ model: true
4
+ real_score_grad:
5
+ model: false
6
+ fake_score_grad:
7
+ model: true
8
+ denoising_step_list:
9
+ - 999
10
+ - 749
11
+ - 499
12
+ - 249
13
+ num_train_timestep: 1000
14
+ real_guidance_scale: 8.0
15
+ generator_task: image
16
+ denoising_loss_type: noise
17
+ mixed_precision: true
18
+ seed: 0
19
+ wandb_host: WANDB_HOST
20
+ wandb_key: WANDB_KEY
21
+ wandb_entity: tyin
22
+ wandb_project: causvid
23
+ wandb_name: causvid_sdxl_test_run_1node
24
+ sharding_strategy: full
25
+ lr: 5.0e-07
26
+ beta1: 0.9
27
+ beta2: 0.999
28
+ data_path: captions_laion6.25.txt
29
+ batch_size: 2
30
+ log_iters: 1000
31
+ negative_prompt: ''
32
+ dfake_gen_update_ratio: 5
33
+ image_or_video_shape:
34
+ - 2
35
+ - 1
36
+ - 4
37
+ - 128
38
+ - 128
39
+ output_path: /mnt/localssd/sdxl_logs
40
+ distillation_loss: dmd
41
+ gradient_checkpointing: false
42
+ warp_denoising_step: false
configs/wan_bidirectional_dmd.yaml ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_name: wan
2
+ generator_fsdp_wrap_strategy: size
3
+ real_score_fsdp_wrap_strategy: size
4
+ fake_score_fsdp_wrap_strategy: size
5
+ text_encoder_fsdp_wrap_strategy: size
6
+ generator_grad:
7
+ model: true
8
+ real_score_grad:
9
+ model: false
10
+ fake_score_grad:
11
+ model: true
12
+ denoising_step_list:
13
+ - 1000
14
+ - 757
15
+ - 522
16
+ num_train_timestep: 1000
17
+ timestep_shift: 8.0
18
+ real_guidance_scale: 3.5
19
+ generator_task: bidirectional_video
20
+ real_task_type: bidirectional_video
21
+ fake_task_type: bidirectional_video
22
+ denoising_loss_type: flow
23
+ mixed_precision: true
24
+ seed: 0
25
+ wandb_host: WANDB_HOST
26
+ wandb_key: WANDB_KEY
27
+ wandb_entity: tyin
28
+ wandb_project: causvid
29
+ wandb_name: wan_bidirectional_dmd
30
+ sharding_strategy: hybrid_full
31
+ lr: 2.0e-06
32
+ beta1: 0.9
33
+ beta2: 0.999
34
+ data_path: sample_dataset/mixkit_prompts.txt
35
+ batch_size: 1
36
+ log_iters: 200
37
+ negative_prompt: '色调艳丽,过曝,静态,细节模糊不清,字幕,风格,作品,画作,画面,静止,整体发灰,最差质量,低质量,JPEG压缩残留,丑陋的,残缺的,多余的手指,画得不好的手部,画得不好的脸部,畸形的,毁容的,形态畸形的肢体,手指融合,静止不动的画面,杂乱的背景,三条腿,背景人很多,倒着走'
38
+ dfake_gen_update_ratio: 5
39
+ image_or_video_shape:
40
+ - 1
41
+ - 21
42
+ - 16
43
+ - 60
44
+ - 104
45
+ output_path: /mnt/localssd/wan_bidirectional_dmd
46
+ distillation_loss: dmd
47
+ gradient_checkpointing: true
48
+ warp_denoising_step: false
configs/wan_bidirectional_dmd_from_scratch.yaml ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_name: wan
2
+ generator_fsdp_wrap_strategy: size
3
+ real_score_fsdp_wrap_strategy: size
4
+ fake_score_fsdp_wrap_strategy: size
5
+ text_encoder_fsdp_wrap_strategy: size
6
+ generator_grad:
7
+ model: true
8
+ real_score_grad:
9
+ model: false
10
+ fake_score_grad:
11
+ model: true
12
+ denoising_step_list:
13
+ - 1000
14
+ - 757
15
+ - 522
16
+ num_train_timestep: 1000
17
+ timestep_shift: 8.0
18
+ real_guidance_scale: 3.5
19
+ generator_task: bidirectional_video
20
+ real_task_type: bidirectional_video
21
+ fake_task_type: bidirectional_video
22
+ denoising_loss_type: flow
23
+ mixed_precision: true
24
+ seed: 0
25
+ wandb_host: WANDB_HOST
26
+ wandb_key: WANDB_KEY
27
+ wandb_entity: tyin
28
+ wandb_project: causvid
29
+ wandb_name: wan_bidirectional_dmd_from_scratch
30
+ sharding_strategy: hybrid_full
31
+ lr: 2.0e-06
32
+ beta1: 0.9
33
+ beta2: 0.999
34
+ data_path: mixkit_latents_lmdb
35
+ batch_size: 1
36
+ log_iters: 200
37
+ negative_prompt: '色调艳丽,过曝,静态,细节模糊不清,字幕,风格,作品,画作,画面,静止,整体发灰,最差质量,低质量,JPEG压缩残留,丑陋的,残缺的,多余的手指,画得不好的手部,画得不好的脸部,畸形的,毁容的,形态畸形的肢体,手指融合,静止不动的画面,杂乱的背景,三条腿,背景人很多,倒着走'
38
+ dfake_gen_update_ratio: 5
39
+ image_or_video_shape:
40
+ - 1
41
+ - 21
42
+ - 16
43
+ - 60
44
+ - 104
45
+ output_path: /mnt/localssd/wan_bidirectional_dmd_from_scratch
46
+ distillation_loss: dmd
47
+ gradient_checkpointing: true
48
+ backward_simulation: false
49
+ warp_denoising_step: false
configs/wan_causal_dmd.yaml ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_name: wan
2
+ generator_name: causal_wan
3
+ generator_ckpt: "wan_causal_ode_checkpoint_model_003000/model.pt"
4
+ generator_fsdp_wrap_strategy: size
5
+ real_score_fsdp_wrap_strategy: size
6
+ fake_score_fsdp_wrap_strategy: size
7
+ text_encoder_fsdp_wrap_strategy: size
8
+ generator_grad:
9
+ model: true
10
+ real_score_grad:
11
+ model: false
12
+ fake_score_grad:
13
+ model: true
14
+ denoising_step_list:
15
+ - 1000
16
+ - 757
17
+ - 522
18
+ - 0
19
+ num_train_timestep: 1000
20
+ timestep_shift: 8.0
21
+ real_guidance_scale: 3.5
22
+ generator_task: causal_video
23
+ real_task_type: bidirectional_video
24
+ fake_task_type: bidirectional_video
25
+ denoising_loss_type: flow
26
+ mixed_precision: true
27
+ seed: 0
28
+ wandb_host: WANDB_HOST
29
+ wandb_key: WANDB_KEY
30
+ wandb_entity: tyin
31
+ wandb_project: causvid
32
+ wandb_name: wan_causal_dmd
33
+ sharding_strategy: hybrid_full
34
+ lr: 2.0e-06
35
+ beta1: 0.9
36
+ beta2: 0.999
37
+ data_path: mixkit_latents_lmdb
38
+ batch_size: 1
39
+ log_iters: 200
40
+ negative_prompt: '色调艳丽,过曝,静态,细节模糊不清,字幕,风格,作品,画作,画面,静止,整体发灰,最差质量,低质量,JPEG压缩残留,丑陋的,残缺的,多余的手指,画得不好的手部,画得不好的脸部,畸形的,毁容的,形态畸形的肢体,手指融合,静止不动的画面,杂乱的背景,三条腿,背景人很多,倒着走'
41
+ dfake_gen_update_ratio: 5
42
+ image_or_video_shape:
43
+ - 1
44
+ - 21
45
+ - 16
46
+ - 60
47
+ - 104
48
+ output_path: /mnt/localssd/wan_causal_dmd
49
+ distillation_loss: dmd
50
+ gradient_checkpointing: true
51
+ backward_simulation: false
52
+ num_frame_per_block: 3
53
+ warp_denoising_step: false
configs/wan_causal_dmd_warp_4step_cfg2.yaml ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_name: wan
2
+ generator_name: causal_wan
3
+ generator_ckpt: "wan_causal_ode_checkpoint_model_003000/model.pt"
4
+ generator_fsdp_wrap_strategy: size
5
+ real_score_fsdp_wrap_strategy: size
6
+ fake_score_fsdp_wrap_strategy: size
7
+ text_encoder_fsdp_wrap_strategy: size
8
+ generator_grad:
9
+ model: true
10
+ real_score_grad:
11
+ model: false
12
+ fake_score_grad:
13
+ model: true
14
+ denoising_step_list:
15
+ - 1000
16
+ - 750
17
+ - 500
18
+ - 250
19
+ - 0
20
+ num_train_timestep: 1000
21
+ timestep_shift: 8.0
22
+ real_guidance_scale: 2.0
23
+ generator_task: causal_video
24
+ real_task_type: bidirectional_video
25
+ fake_task_type: bidirectional_video
26
+ denoising_loss_type: flow
27
+ mixed_precision: true
28
+ seed: 0
29
+ wandb_host: WANDB_HOST
30
+ wandb_key: WANDB_KEY
31
+ wandb_entity: tyin
32
+ wandb_project: causvid
33
+ wandb_name: wan_causal_dmd
34
+ sharding_strategy: hybrid_full
35
+ lr: 2.0e-06
36
+ beta1: 0.9
37
+ beta2: 0.999
38
+ data_path: mixkit_latents_lmdb
39
+ batch_size: 1
40
+ log_iters: 200
41
+ negative_prompt: '色调艳丽,过曝,静态,细节模糊不清,字幕,风格,作品,画作,画面,静止,整体发灰,最差质量,低质量,JPEG压缩残留,丑陋的,残缺的,多余的手指,画得不好的手部,画得不好的脸部,畸形的,毁容的,形态畸形的肢体,手指融合,静止不动的画面,杂乱的背景,三条腿,背景人很多,倒着走'
42
+ dfake_gen_update_ratio: 5
43
+ image_or_video_shape:
44
+ - 1
45
+ - 21
46
+ - 16
47
+ - 60
48
+ - 104
49
+ output_path: /mnt/localssd/wan_causal_dmd_warp_4step
50
+ distillation_loss: dmd
51
+ gradient_checkpointing: true
52
+ backward_simulation: false
53
+ num_frame_per_block: 3
54
+ warp_denoising_step: true
configs/wan_causal_ode.yaml ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_name: causal_wan
2
+ generator_ckpt: "pretrained_ode.pt"
3
+ generator_grad:
4
+ model: true
5
+ denoising_step_list:
6
+ - 1000
7
+ - 757
8
+ - 522
9
+ - 0
10
+ generator_task: causal_video
11
+ generator_fsdp_wrap_strategy: size
12
+ text_encoder_fsdp_wrap_strategy: size
13
+ mixed_precision: true
14
+ seed: 0
15
+ wandb_host: https://api.wandb.ai
16
+ wandb_key: WANDB_KEY
17
+ wandb_entity: liyitong-Tsinghua University
18
+ wandb_project: self-forcing
19
+ wandb_name: wan_causal_ode
20
+ sharding_strategy: hybrid_full
21
+ lr: 2.0e-06
22
+ beta1: 0.9
23
+ beta2: 0.999
24
+ data_path: ../mixkit_ode_lmdb
25
+ batch_size: 2
26
+ log_iters: 200
27
+ output_path: ./output
28
+ distillation_loss: ode
29
+ gradient_checkpointing: true
30
+ num_frame_per_block: 3
31
+ warp_denoising_step: false
output/wandb/run-20250908_063808-yfn0incq/files/output.log ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run dir: ./output/wandb/run-20250908_063808-yfn0incq/files
2
+ Start training step 0...
3
+ cache a block wise causal mask with block size of 3 frames
4
+ BlockMask(shape=(1, 1, 32768, 32768), sparsity=42.52%,
5
+ (0, 0)
6
+ ████░░
7
+ ████░░
8
+ ████░░░░░░░░
9
+ ██████████░░
10
+ ██████████░░
11
+ ██████████░░░░░░░░
12
+ ████████████████░░
13
+ ████████████████░░
14
+ ████████████████░░░░░░░░
15
+ ██████████████████████░░
16
+ ██████████████████████░░
17
+ ██████████████████████░░░░░░░░
18
+ ████████████████████████████░░
19
+ ████████████████████████████░░
20
+ ████████████████████████████████░░
21
+ ████████████████████████████████░░
22
+ ████████████████████████████████░░░░░░░░
23
+ ████████████████████████████████████████
24
+ ████████████████████████████████████████
25
+ ████████████████████████████████████████
26
+ )
output/wandb/run-20250908_063808-yfn0incq/files/requirements.txt ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ nvidia-cuda-nvrtc-cu12==12.8.93
2
+ filelock==3.19.1
3
+ aiofiles==24.1.0
4
+ PyYAML==6.0.2
5
+ httpx==0.28.1
6
+ multidict==6.6.4
7
+ tifffile==2025.5.10
8
+ tzdata==2025.2
9
+ urllib3==2.5.0
10
+ decord==0.6.0
11
+ certifi==2025.8.3
12
+ setuptools==78.1.1
13
+ websocket-client==1.8.0
14
+ gitdb==4.0.12
15
+ yarl==1.20.1
16
+ tqdm==4.67.1
17
+ open_clip_torch==3.1.0
18
+ pyparsing==3.2.3
19
+ fastapi==0.116.1
20
+ nvidia-curand-cu12==10.3.9.90
21
+ mdurl==0.1.2
22
+ torchvision==0.23.0
23
+ h11==0.16.0
24
+ pytz==2025.2
25
+ six==1.17.0
26
+ nvidia-cufile-cu12==1.13.1.3
27
+ aiohappyeyeballs==2.6.1
28
+ wandb==0.21.3
29
+ nvidia-nvjitlink-cu12==12.8.93
30
+ cycler==0.12.1
31
+ anyio==4.10.0
32
+ scikit-image==0.25.2
33
+ nvidia-cuda-runtime-cu12==12.8.90
34
+ sentencepiece==0.2.1
35
+ rich==14.1.0
36
+ pydantic==2.11.7
37
+ GitPython==3.1.45
38
+ python-dateutil==2.9.0.post0
39
+ accelerate==1.10.1
40
+ proglog==0.1.12
41
+ sentry-sdk==2.37.0
42
+ nvidia-cusparselt-cu12==0.7.1
43
+ dashscope==1.24.3
44
+ platformdirs==4.4.0
45
+ safehttpx==0.1.6
46
+ fsspec==2025.9.0
47
+ lazy_loader==0.4
48
+ typing_extensions==4.15.0
49
+ semantic-version==2.10.0
50
+ numpy==1.24.4
51
+ nvidia-cufft-cu12==11.3.3.83
52
+ ruff==0.12.12
53
+ nvidia-cudnn-cu12==9.10.2.21
54
+ annotated-types==0.7.0
55
+ decorator==4.4.2
56
+ antlr4-python3-runtime==4.9.3
57
+ psutil==7.0.0
58
+ Brotli==1.1.0
59
+ tomlkit==0.13.3
60
+ httpcore==1.0.9
61
+ kiwisolver==1.4.9
62
+ nvidia-cusparse-cu12==12.5.8.93
63
+ groovy==0.1.2
64
+ protobuf==6.32.0
65
+ orjson==3.11.3
66
+ scipy==1.15.3
67
+ regex==2025.9.1
68
+ MarkupSafe==3.0.2
69
+ av==13.1.0
70
+ timm==1.0.19
71
+ uvicorn==0.35.0
72
+ wheel==0.45.1
73
+ Pygments==2.19.2
74
+ websockets==15.0.1
75
+ lmdb==1.7.3
76
+ sympy==1.14.0
77
+ einops==0.8.1
78
+ idna==3.10
79
+ triton==3.4.0
80
+ torch==2.8.0
81
+ moviepy==1.0.3
82
+ nvidia-nvtx-cu12==12.8.90
83
+ matplotlib==3.10.6
84
+ pillow==11.3.0
85
+ charset-normalizer==3.4.3
86
+ attrs==25.3.0
87
+ aiosignal==1.4.0
88
+ markdown-it-py==4.0.0
89
+ requests==2.32.5
90
+ typer==0.17.4
91
+ huggingface-hub==0.34.4
92
+ nvidia-nccl-cu12==2.27.3
93
+ propcache==0.3.2
94
+ opencv-python==4.11.0.86
95
+ ffmpy==0.6.1
96
+ jmespath==1.0.1
97
+ botocore==1.40.25
98
+ pydantic_core==2.33.2
99
+ fonttools==4.59.2
100
+ omegaconf==2.3.0
101
+ pycparser==2.22
102
+ mpmath==1.3.0
103
+ flash_attn==2.8.3
104
+ smmap==5.0.2
105
+ gradio_client==1.12.1
106
+ exceptiongroup==1.3.0
107
+ cffi==1.17.1
108
+ diffusers==0.31.0
109
+ nvidia-cusolver-cu12==11.7.3.90
110
+ contourpy==1.3.2
111
+ cryptography==45.0.7
112
+ nvidia-cuda-cupti-cu12==12.8.90
113
+ wcwidth==0.2.13
114
+ zipp==3.23.0
115
+ safetensors==0.6.2
116
+ gradio==5.44.1
117
+ click==8.2.1
118
+ frozenlist==1.7.0
119
+ networkx==3.4.2
120
+ s3transfer==0.13.1
121
+ shellingham==1.5.4
122
+ starlette==0.47.3
123
+ packaging==25.0
124
+ ftfy==6.3.1
125
+ importlib_metadata==8.7.0
126
+ transformers==4.56.1
127
+ nvidia-cublas-cu12==12.8.4.1
128
+ Jinja2==3.1.6
129
+ pycocotools==2.0.10
130
+ sniffio==1.3.1
131
+ hf-xet==1.1.9
132
+ typing-inspection==0.4.1
133
+ pandas==2.3.2
134
+ python-multipart==0.0.20
135
+ aiohttp==3.12.15
136
+ clip==1.0
137
+ pydub==0.25.1
138
+ easydict==1.13
139
+ pip==25.2
140
+ tokenizers==0.22.0
141
+ imageio==2.37.0
142
+ async-timeout==5.0.1
143
+ boto3==1.40.25
144
+ imageio-ffmpeg==0.6.0
145
+ CausVid==0.0.1
output/wandb/run-20250908_063808-yfn0incq/files/wandb-metadata.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1028-aws-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2025-09-08T06:38:08.309033Z",
5
+ "args": [
6
+ "--config_path",
7
+ "configs/wan_causal_ode.yaml"
8
+ ],
9
+ "program": "/home/yitongli/CausVid/causvid/train_ode.py",
10
+ "codePath": "causvid/train_ode.py",
11
+ "codePathLocal": "causvid/train_ode.py",
12
+ "git": {
13
+ "remote": "https://github.com/tianweiy/CausVid.git",
14
+ "commit": "adb6a5ecd07666b4d0290042915c8406e6d5ce22"
15
+ },
16
+ "email": "[email protected]",
17
+ "root": "./output",
18
+ "host": "ip-172-31-3-169",
19
+ "executable": "/home/yitongli/miniconda3/envs/causvid/bin/python3.10",
20
+ "cpu_count": 48,
21
+ "cpu_count_logical": 96,
22
+ "gpu": "NVIDIA A100-SXM4-80GB",
23
+ "gpu_count": 8,
24
+ "disk": {
25
+ "/": {
26
+ "total": "2079114358784",
27
+ "used": "1367494828032"
28
+ }
29
+ },
30
+ "memory": {
31
+ "total": "1204521443328"
32
+ },
33
+ "gpu_nvidia": [
34
+ {
35
+ "name": "NVIDIA A100-SXM4-80GB",
36
+ "memoryTotal": "85899345920",
37
+ "cudaCores": 6912,
38
+ "architecture": "Ampere",
39
+ "uuid": "GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949"
40
+ },
41
+ {
42
+ "name": "NVIDIA A100-SXM4-80GB",
43
+ "memoryTotal": "85899345920",
44
+ "cudaCores": 6912,
45
+ "architecture": "Ampere",
46
+ "uuid": "GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42"
47
+ },
48
+ {
49
+ "name": "NVIDIA A100-SXM4-80GB",
50
+ "memoryTotal": "85899345920",
51
+ "cudaCores": 6912,
52
+ "architecture": "Ampere",
53
+ "uuid": "GPU-1f47056a-9c2c-8af1-8232-636203622830"
54
+ },
55
+ {
56
+ "name": "NVIDIA A100-SXM4-80GB",
57
+ "memoryTotal": "85899345920",
58
+ "cudaCores": 6912,
59
+ "architecture": "Ampere",
60
+ "uuid": "GPU-38de1dff-a680-ec66-625b-49f2a31e3b42"
61
+ },
62
+ {
63
+ "name": "NVIDIA A100-SXM4-80GB",
64
+ "memoryTotal": "85899345920",
65
+ "cudaCores": 6912,
66
+ "architecture": "Ampere",
67
+ "uuid": "GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204"
68
+ },
69
+ {
70
+ "name": "NVIDIA A100-SXM4-80GB",
71
+ "memoryTotal": "85899345920",
72
+ "cudaCores": 6912,
73
+ "architecture": "Ampere",
74
+ "uuid": "GPU-194ed489-5bfa-defc-85b1-812953e7d84a"
75
+ },
76
+ {
77
+ "name": "NVIDIA A100-SXM4-80GB",
78
+ "memoryTotal": "85899345920",
79
+ "cudaCores": 6912,
80
+ "architecture": "Ampere",
81
+ "uuid": "GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4"
82
+ },
83
+ {
84
+ "name": "NVIDIA A100-SXM4-80GB",
85
+ "memoryTotal": "85899345920",
86
+ "cudaCores": 6912,
87
+ "architecture": "Ampere",
88
+ "uuid": "GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057"
89
+ }
90
+ ],
91
+ "cudaVersion": "12.8",
92
+ "writerId": "051fauhxsqz43onnqgc6jbdjqxushh74"
93
+ }
output/wandb/run-20250908_063808-yfn0incq/logs/debug-core.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T06:38:08.329996016Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpmfwk91u6/port-3438882.txt","pid":3438882,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2025-09-08T06:38:08.330648777Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3438882}
3
+ {"time":"2025-09-08T06:38:08.330657813Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3438882-3439217-2707863955/socket","Net":"unix"}}
4
+ {"time":"2025-09-08T06:38:08.516356689Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2025-09-08T06:38:08.52538569Z","level":"INFO","msg":"handleInformInit: received","streamId":"yfn0incq","id":"1(@)"}
6
+ {"time":"2025-09-08T06:38:08.725905857Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"yfn0incq","id":"1(@)"}
7
+ {"time":"2025-09-08T06:46:21.545953845Z","level":"INFO","msg":"server: parent process exited, terminating service process"}
output/wandb/run-20250908_063808-yfn0incq/logs/debug-internal.log ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T06:38:08.52564227Z","level":"INFO","msg":"stream: starting","core version":"0.21.3"}
2
+ {"time":"2025-09-08T06:38:08.725733203Z","level":"INFO","msg":"stream: created new stream","id":"yfn0incq"}
3
+ {"time":"2025-09-08T06:38:08.725892734Z","level":"INFO","msg":"stream: started","id":"yfn0incq"}
4
+ {"time":"2025-09-08T06:38:08.725914161Z","level":"INFO","msg":"writer: started","stream_id":"yfn0incq"}
5
+ {"time":"2025-09-08T06:38:08.725929156Z","level":"INFO","msg":"sender: started","stream_id":"yfn0incq"}
6
+ {"time":"2025-09-08T06:38:08.725920349Z","level":"INFO","msg":"handler: started","stream_id":"yfn0incq"}
output/wandb/run-20250908_063808-yfn0incq/logs/debug.log ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_setup.py:_flush():81] Current SDK version is 0.21.3
2
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_setup.py:_flush():81] Configure stats pid to 3438882
3
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/.config/wandb/settings
4
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/CausVid/wandb/settings
5
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_init.py:setup_run_log_directory():686] Logging user logs to ./output/wandb/run-20250908_063808-yfn0incq/logs/debug.log
7
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_init.py:setup_run_log_directory():687] Logging internal logs to ./output/wandb/run-20250908_063808-yfn0incq/logs/debug-internal.log
8
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_init.py:init():813] calling init triggers
9
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_init.py:init():818] wandb.init called with sweep_config: {}
10
+ config: {'model_name': 'causal_wan', 'generator_grad': {'model': True}, 'denoising_step_list': [1000, 757, 522, 0], 'generator_task': 'causal_video', 'generator_fsdp_wrap_strategy': 'size', 'text_encoder_fsdp_wrap_strategy': 'size', 'mixed_precision': True, 'seed': 9828283, 'wandb_host': 'https://api.wandb.ai', 'wandb_key': 'WANDB_KEY', 'wandb_entity': 'liyitong-Tsinghua University', 'wandb_project': 'self-forcing', 'wandb_name': 'wan_causal_ode', 'sharding_strategy': 'hybrid_full', 'lr': 2e-06, 'beta1': 0.9, 'beta2': 0.999, 'data_path': '../mixkit_ode_lmdb', 'batch_size': 2, 'log_iters': 200, 'output_path': './output', 'distillation_loss': 'ode', 'gradient_checkpointing': True, 'num_frame_per_block': 3, 'warp_denoising_step': False, 'no_save': False, '_wandb': {}}
11
+ 2025-09-08 06:38:08,310 INFO MainThread:3438882 [wandb_init.py:init():854] starting backend
12
+ 2025-09-08 06:38:08,516 INFO MainThread:3438882 [wandb_init.py:init():857] sending inform_init request
13
+ 2025-09-08 06:38:08,520 INFO MainThread:3438882 [wandb_init.py:init():865] backend started and connected
14
+ 2025-09-08 06:38:08,523 INFO MainThread:3438882 [wandb_init.py:init():936] updated telemetry
15
+ 2025-09-08 06:38:08,528 INFO MainThread:3438882 [wandb_init.py:init():960] communicating run to backend with 90.0 second timeout
16
+ 2025-09-08 06:38:08,916 INFO MainThread:3438882 [wandb_init.py:init():1011] starting run threads in backend
17
+ 2025-09-08 06:38:09,029 INFO MainThread:3438882 [wandb_run.py:_console_start():2494] atexit reg
18
+ 2025-09-08 06:38:09,029 INFO MainThread:3438882 [wandb_run.py:_redirect():2342] redirect: wrap_raw
19
+ 2025-09-08 06:38:09,029 INFO MainThread:3438882 [wandb_run.py:_redirect():2411] Wrapping output streams.
20
+ 2025-09-08 06:38:09,030 INFO MainThread:3438882 [wandb_run.py:_redirect():2434] Redirects installed.
21
+ 2025-09-08 06:38:09,032 INFO MainThread:3438882 [wandb_init.py:init():1057] run started, returning control to user process
22
+ 2025-09-08 06:38:09,410 INFO MainThread:3438882 [wandb_run.py:_config_callback():1380] config_cb None None {'_wandb': {'code_path': 'source-self-forcing-causvid_train_ode.py'}}
output/wandb/run-20250908_063808-yfn0incq/run-yfn0incq.wandb ADDED
Binary file (98.3 kB). View file
 
output/wandb/run-20250908_064634-xd44venm/files/wandb-metadata.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1028-aws-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2025-09-08T06:46:34.797035Z",
5
+ "args": [
6
+ "--config_path",
7
+ "configs/wan_causal_ode.yaml"
8
+ ],
9
+ "program": "/home/yitongli/CausVid/causvid/train_ode.py",
10
+ "codePath": "causvid/train_ode.py",
11
+ "codePathLocal": "causvid/train_ode.py",
12
+ "git": {
13
+ "remote": "https://github.com/tianweiy/CausVid.git",
14
+ "commit": "adb6a5ecd07666b4d0290042915c8406e6d5ce22"
15
+ },
16
+ "email": "[email protected]",
17
+ "root": "./output",
18
+ "host": "ip-172-31-3-169",
19
+ "executable": "/home/yitongli/miniconda3/envs/causvid/bin/python3.10",
20
+ "cpu_count": 48,
21
+ "cpu_count_logical": 96,
22
+ "gpu": "NVIDIA A100-SXM4-80GB",
23
+ "gpu_count": 8,
24
+ "disk": {
25
+ "/": {
26
+ "total": "2079114358784",
27
+ "used": "1367495385088"
28
+ }
29
+ },
30
+ "memory": {
31
+ "total": "1204521443328"
32
+ },
33
+ "gpu_nvidia": [
34
+ {
35
+ "name": "NVIDIA A100-SXM4-80GB",
36
+ "memoryTotal": "85899345920",
37
+ "cudaCores": 6912,
38
+ "architecture": "Ampere",
39
+ "uuid": "GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949"
40
+ },
41
+ {
42
+ "name": "NVIDIA A100-SXM4-80GB",
43
+ "memoryTotal": "85899345920",
44
+ "cudaCores": 6912,
45
+ "architecture": "Ampere",
46
+ "uuid": "GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42"
47
+ },
48
+ {
49
+ "name": "NVIDIA A100-SXM4-80GB",
50
+ "memoryTotal": "85899345920",
51
+ "cudaCores": 6912,
52
+ "architecture": "Ampere",
53
+ "uuid": "GPU-1f47056a-9c2c-8af1-8232-636203622830"
54
+ },
55
+ {
56
+ "name": "NVIDIA A100-SXM4-80GB",
57
+ "memoryTotal": "85899345920",
58
+ "cudaCores": 6912,
59
+ "architecture": "Ampere",
60
+ "uuid": "GPU-38de1dff-a680-ec66-625b-49f2a31e3b42"
61
+ },
62
+ {
63
+ "name": "NVIDIA A100-SXM4-80GB",
64
+ "memoryTotal": "85899345920",
65
+ "cudaCores": 6912,
66
+ "architecture": "Ampere",
67
+ "uuid": "GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204"
68
+ },
69
+ {
70
+ "name": "NVIDIA A100-SXM4-80GB",
71
+ "memoryTotal": "85899345920",
72
+ "cudaCores": 6912,
73
+ "architecture": "Ampere",
74
+ "uuid": "GPU-194ed489-5bfa-defc-85b1-812953e7d84a"
75
+ },
76
+ {
77
+ "name": "NVIDIA A100-SXM4-80GB",
78
+ "memoryTotal": "85899345920",
79
+ "cudaCores": 6912,
80
+ "architecture": "Ampere",
81
+ "uuid": "GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4"
82
+ },
83
+ {
84
+ "name": "NVIDIA A100-SXM4-80GB",
85
+ "memoryTotal": "85899345920",
86
+ "cudaCores": 6912,
87
+ "architecture": "Ampere",
88
+ "uuid": "GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057"
89
+ }
90
+ ],
91
+ "cudaVersion": "12.8",
92
+ "writerId": "u3mfnczl6vj98a25sgfj3dvcuv00y0jd"
93
+ }
output/wandb/run-20250908_064634-xd44venm/logs/debug-core.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T06:46:34.819015681Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp9b1_vyfw/port-3454108.txt","pid":3454108,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2025-09-08T06:46:34.819705153Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3454108}
3
+ {"time":"2025-09-08T06:46:34.819700396Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3454108-3454427-2811185260/socket","Net":"unix"}}
4
+ {"time":"2025-09-08T06:46:35.005856196Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2025-09-08T06:46:35.017139949Z","level":"INFO","msg":"handleInformInit: received","streamId":"xd44venm","id":"1(@)"}
6
+ {"time":"2025-09-08T06:46:35.219626779Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"xd44venm","id":"1(@)"}
7
+ {"time":"2025-09-08T06:56:07.684243507Z","level":"INFO","msg":"server: parent process exited, terminating service process"}
output/wandb/run-20250908_065643-lyib7g2q/files/output.log ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run dir: ./output/wandb/run-20250908_065643-lyib7g2q/files
2
+ cache a block wise causal mask with block size of 3 frames
3
+ BlockMask(shape=(1, 1, 32768, 32768), sparsity=42.52%,
4
+ (0, 0)
5
+ ████░░
6
+ ████░░
7
+ ████░░░░░░░░
8
+ ██████████░░
9
+ ██████████░░
10
+ ██████████░░░░░░░░
11
+ ████████████████░░
12
+ ████████████████░░
13
+ ████████████████░░░░░░░░
14
+ ██████████████████████░░
15
+ ██████████████████████░░
16
+ ██████████████████████░░░░░░░░
17
+ ████████████████████████████░░
18
+ ████████████████████████████░░
19
+ ████████████████████████████████░░
20
+ ████████████████████████████████░░
21
+ ████████████████████████████████░░░░░░░░
22
+ ████████████████████████████████████████
23
+ ████████████████████████████████████████
24
+ ████████████████████████████████████████
25
+ )
output/wandb/run-20250908_065643-lyib7g2q/files/requirements.txt ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ nvidia-cuda-nvrtc-cu12==12.8.93
2
+ filelock==3.19.1
3
+ aiofiles==24.1.0
4
+ PyYAML==6.0.2
5
+ httpx==0.28.1
6
+ multidict==6.6.4
7
+ tifffile==2025.5.10
8
+ tzdata==2025.2
9
+ urllib3==2.5.0
10
+ decord==0.6.0
11
+ certifi==2025.8.3
12
+ setuptools==78.1.1
13
+ websocket-client==1.8.0
14
+ gitdb==4.0.12
15
+ yarl==1.20.1
16
+ tqdm==4.67.1
17
+ open_clip_torch==3.1.0
18
+ pyparsing==3.2.3
19
+ fastapi==0.116.1
20
+ nvidia-curand-cu12==10.3.9.90
21
+ mdurl==0.1.2
22
+ torchvision==0.23.0
23
+ h11==0.16.0
24
+ pytz==2025.2
25
+ six==1.17.0
26
+ nvidia-cufile-cu12==1.13.1.3
27
+ aiohappyeyeballs==2.6.1
28
+ wandb==0.21.3
29
+ nvidia-nvjitlink-cu12==12.8.93
30
+ cycler==0.12.1
31
+ anyio==4.10.0
32
+ scikit-image==0.25.2
33
+ nvidia-cuda-runtime-cu12==12.8.90
34
+ sentencepiece==0.2.1
35
+ rich==14.1.0
36
+ pydantic==2.11.7
37
+ GitPython==3.1.45
38
+ python-dateutil==2.9.0.post0
39
+ accelerate==1.10.1
40
+ proglog==0.1.12
41
+ sentry-sdk==2.37.0
42
+ nvidia-cusparselt-cu12==0.7.1
43
+ dashscope==1.24.3
44
+ platformdirs==4.4.0
45
+ safehttpx==0.1.6
46
+ fsspec==2025.9.0
47
+ lazy_loader==0.4
48
+ typing_extensions==4.15.0
49
+ semantic-version==2.10.0
50
+ numpy==1.24.4
51
+ nvidia-cufft-cu12==11.3.3.83
52
+ ruff==0.12.12
53
+ nvidia-cudnn-cu12==9.10.2.21
54
+ annotated-types==0.7.0
55
+ decorator==4.4.2
56
+ antlr4-python3-runtime==4.9.3
57
+ psutil==7.0.0
58
+ Brotli==1.1.0
59
+ tomlkit==0.13.3
60
+ httpcore==1.0.9
61
+ kiwisolver==1.4.9
62
+ nvidia-cusparse-cu12==12.5.8.93
63
+ groovy==0.1.2
64
+ protobuf==6.32.0
65
+ orjson==3.11.3
66
+ scipy==1.15.3
67
+ regex==2025.9.1
68
+ MarkupSafe==3.0.2
69
+ av==13.1.0
70
+ timm==1.0.19
71
+ uvicorn==0.35.0
72
+ wheel==0.45.1
73
+ Pygments==2.19.2
74
+ websockets==15.0.1
75
+ lmdb==1.7.3
76
+ sympy==1.14.0
77
+ einops==0.8.1
78
+ idna==3.10
79
+ triton==3.4.0
80
+ torch==2.8.0
81
+ moviepy==1.0.3
82
+ nvidia-nvtx-cu12==12.8.90
83
+ matplotlib==3.10.6
84
+ pillow==11.3.0
85
+ charset-normalizer==3.4.3
86
+ attrs==25.3.0
87
+ aiosignal==1.4.0
88
+ markdown-it-py==4.0.0
89
+ requests==2.32.5
90
+ typer==0.17.4
91
+ huggingface-hub==0.34.4
92
+ nvidia-nccl-cu12==2.27.3
93
+ propcache==0.3.2
94
+ opencv-python==4.11.0.86
95
+ ffmpy==0.6.1
96
+ jmespath==1.0.1
97
+ botocore==1.40.25
98
+ pydantic_core==2.33.2
99
+ fonttools==4.59.2
100
+ omegaconf==2.3.0
101
+ pycparser==2.22
102
+ mpmath==1.3.0
103
+ flash_attn==2.8.3
104
+ smmap==5.0.2
105
+ gradio_client==1.12.1
106
+ exceptiongroup==1.3.0
107
+ cffi==1.17.1
108
+ diffusers==0.31.0
109
+ nvidia-cusolver-cu12==11.7.3.90
110
+ contourpy==1.3.2
111
+ cryptography==45.0.7
112
+ nvidia-cuda-cupti-cu12==12.8.90
113
+ wcwidth==0.2.13
114
+ zipp==3.23.0
115
+ safetensors==0.6.2
116
+ gradio==5.44.1
117
+ click==8.2.1
118
+ frozenlist==1.7.0
119
+ networkx==3.4.2
120
+ s3transfer==0.13.1
121
+ shellingham==1.5.4
122
+ starlette==0.47.3
123
+ packaging==25.0
124
+ ftfy==6.3.1
125
+ importlib_metadata==8.7.0
126
+ transformers==4.56.1
127
+ nvidia-cublas-cu12==12.8.4.1
128
+ Jinja2==3.1.6
129
+ pycocotools==2.0.10
130
+ sniffio==1.3.1
131
+ hf-xet==1.1.9
132
+ typing-inspection==0.4.1
133
+ pandas==2.3.2
134
+ python-multipart==0.0.20
135
+ aiohttp==3.12.15
136
+ clip==1.0
137
+ pydub==0.25.1
138
+ easydict==1.13
139
+ pip==25.2
140
+ tokenizers==0.22.0
141
+ imageio==2.37.0
142
+ async-timeout==5.0.1
143
+ boto3==1.40.25
144
+ imageio-ffmpeg==0.6.0
145
+ CausVid==0.0.1
output/wandb/run-20250908_065643-lyib7g2q/files/wandb-metadata.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1028-aws-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2025-09-08T06:56:43.722768Z",
5
+ "args": [
6
+ "--config_path",
7
+ "configs/wan_causal_ode.yaml"
8
+ ],
9
+ "program": "/home/yitongli/CausVid/causvid/train_ode.py",
10
+ "codePath": "causvid/train_ode.py",
11
+ "codePathLocal": "causvid/train_ode.py",
12
+ "git": {
13
+ "remote": "https://github.com/tianweiy/CausVid.git",
14
+ "commit": "adb6a5ecd07666b4d0290042915c8406e6d5ce22"
15
+ },
16
+ "email": "[email protected]",
17
+ "root": "./output",
18
+ "host": "ip-172-31-3-169",
19
+ "executable": "/home/yitongli/miniconda3/envs/causvid/bin/python3.10",
20
+ "cpu_count": 48,
21
+ "cpu_count_logical": 96,
22
+ "gpu": "NVIDIA A100-SXM4-80GB",
23
+ "gpu_count": 8,
24
+ "disk": {
25
+ "/": {
26
+ "total": "2079114358784",
27
+ "used": "1367495954432"
28
+ }
29
+ },
30
+ "memory": {
31
+ "total": "1204521443328"
32
+ },
33
+ "gpu_nvidia": [
34
+ {
35
+ "name": "NVIDIA A100-SXM4-80GB",
36
+ "memoryTotal": "85899345920",
37
+ "cudaCores": 6912,
38
+ "architecture": "Ampere",
39
+ "uuid": "GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949"
40
+ },
41
+ {
42
+ "name": "NVIDIA A100-SXM4-80GB",
43
+ "memoryTotal": "85899345920",
44
+ "cudaCores": 6912,
45
+ "architecture": "Ampere",
46
+ "uuid": "GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42"
47
+ },
48
+ {
49
+ "name": "NVIDIA A100-SXM4-80GB",
50
+ "memoryTotal": "85899345920",
51
+ "cudaCores": 6912,
52
+ "architecture": "Ampere",
53
+ "uuid": "GPU-1f47056a-9c2c-8af1-8232-636203622830"
54
+ },
55
+ {
56
+ "name": "NVIDIA A100-SXM4-80GB",
57
+ "memoryTotal": "85899345920",
58
+ "cudaCores": 6912,
59
+ "architecture": "Ampere",
60
+ "uuid": "GPU-38de1dff-a680-ec66-625b-49f2a31e3b42"
61
+ },
62
+ {
63
+ "name": "NVIDIA A100-SXM4-80GB",
64
+ "memoryTotal": "85899345920",
65
+ "cudaCores": 6912,
66
+ "architecture": "Ampere",
67
+ "uuid": "GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204"
68
+ },
69
+ {
70
+ "name": "NVIDIA A100-SXM4-80GB",
71
+ "memoryTotal": "85899345920",
72
+ "cudaCores": 6912,
73
+ "architecture": "Ampere",
74
+ "uuid": "GPU-194ed489-5bfa-defc-85b1-812953e7d84a"
75
+ },
76
+ {
77
+ "name": "NVIDIA A100-SXM4-80GB",
78
+ "memoryTotal": "85899345920",
79
+ "cudaCores": 6912,
80
+ "architecture": "Ampere",
81
+ "uuid": "GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4"
82
+ },
83
+ {
84
+ "name": "NVIDIA A100-SXM4-80GB",
85
+ "memoryTotal": "85899345920",
86
+ "cudaCores": 6912,
87
+ "architecture": "Ampere",
88
+ "uuid": "GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057"
89
+ }
90
+ ],
91
+ "cudaVersion": "12.8",
92
+ "writerId": "nrbwifb91qzia1ndhn1iu2g7eodid6yk"
93
+ }
output/wandb/run-20250908_065643-lyib7g2q/logs/debug-core.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T06:56:43.750357486Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp4mhsv4lj/port-3470051.txt","pid":3470051,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2025-09-08T06:56:43.750987576Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3470051}
3
+ {"time":"2025-09-08T06:56:43.750983708Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3470051-3470349-2506732261/socket","Net":"unix"}}
4
+ {"time":"2025-09-08T06:56:43.936283119Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2025-09-08T06:56:43.944508948Z","level":"INFO","msg":"handleInformInit: received","streamId":"lyib7g2q","id":"1(@)"}
6
+ {"time":"2025-09-08T06:56:44.157850577Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"lyib7g2q","id":"1(@)"}
7
+ {"time":"2025-09-08T07:06:27.322661473Z","level":"INFO","msg":"server: parent process exited, terminating service process"}
output/wandb/run-20250908_065643-lyib7g2q/logs/debug-internal.log ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T06:56:43.94460419Z","level":"INFO","msg":"stream: starting","core version":"0.21.3"}
2
+ {"time":"2025-09-08T06:56:44.157805156Z","level":"INFO","msg":"stream: created new stream","id":"lyib7g2q"}
3
+ {"time":"2025-09-08T06:56:44.157846153Z","level":"INFO","msg":"stream: started","id":"lyib7g2q"}
4
+ {"time":"2025-09-08T06:56:44.157856214Z","level":"INFO","msg":"handler: started","stream_id":"lyib7g2q"}
5
+ {"time":"2025-09-08T06:56:44.15785768Z","level":"INFO","msg":"sender: started","stream_id":"lyib7g2q"}
6
+ {"time":"2025-09-08T06:56:44.157877833Z","level":"INFO","msg":"writer: started","stream_id":"lyib7g2q"}
output/wandb/run-20250908_065643-lyib7g2q/logs/debug.log ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_setup.py:_flush():81] Current SDK version is 0.21.3
2
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_setup.py:_flush():81] Configure stats pid to 3470051
3
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/.config/wandb/settings
4
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/CausVid/wandb/settings
5
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_init.py:setup_run_log_directory():686] Logging user logs to ./output/wandb/run-20250908_065643-lyib7g2q/logs/debug.log
7
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_init.py:setup_run_log_directory():687] Logging internal logs to ./output/wandb/run-20250908_065643-lyib7g2q/logs/debug-internal.log
8
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_init.py:init():813] calling init triggers
9
+ 2025-09-08 06:56:43,725 INFO MainThread:3470051 [wandb_init.py:init():818] wandb.init called with sweep_config: {}
10
+ config: {'model_name': 'causal_wan', 'generator_grad': {'model': True}, 'denoising_step_list': [1000, 757, 522, 0], 'generator_task': 'causal_video', 'generator_fsdp_wrap_strategy': 'size', 'text_encoder_fsdp_wrap_strategy': 'size', 'mixed_precision': True, 'seed': 7956051, 'wandb_host': 'https://api.wandb.ai', 'wandb_key': '5409d3b960b01b25cec0f6abb5361b4022f0cc41', 'wandb_entity': 'liyitong-Tsinghua University', 'wandb_project': 'self-forcing', 'wandb_name': 'wan_causal_ode', 'sharding_strategy': 'hybrid_full', 'lr': 2e-06, 'beta1': 0.9, 'beta2': 0.999, 'data_path': '../mixkit_ode_lmdb', 'batch_size': 2, 'log_iters': 200, 'output_path': './output', 'distillation_loss': 'ode', 'gradient_checkpointing': True, 'num_frame_per_block': 3, 'warp_denoising_step': False, 'no_save': False, '_wandb': {}}
11
+ 2025-09-08 06:56:43,726 INFO MainThread:3470051 [wandb_init.py:init():854] starting backend
12
+ 2025-09-08 06:56:43,936 INFO MainThread:3470051 [wandb_init.py:init():857] sending inform_init request
13
+ 2025-09-08 06:56:43,942 INFO MainThread:3470051 [wandb_init.py:init():865] backend started and connected
14
+ 2025-09-08 06:56:43,949 INFO MainThread:3470051 [wandb_init.py:init():936] updated telemetry
15
+ 2025-09-08 06:56:43,956 INFO MainThread:3470051 [wandb_init.py:init():960] communicating run to backend with 90.0 second timeout
16
+ 2025-09-08 06:56:44,314 INFO MainThread:3470051 [wandb_init.py:init():1011] starting run threads in backend
17
+ 2025-09-08 06:56:44,487 INFO MainThread:3470051 [wandb_run.py:_console_start():2494] atexit reg
18
+ 2025-09-08 06:56:44,487 INFO MainThread:3470051 [wandb_run.py:_redirect():2342] redirect: wrap_raw
19
+ 2025-09-08 06:56:44,487 INFO MainThread:3470051 [wandb_run.py:_redirect():2411] Wrapping output streams.
20
+ 2025-09-08 06:56:44,487 INFO MainThread:3470051 [wandb_run.py:_redirect():2434] Redirects installed.
21
+ 2025-09-08 06:56:44,489 INFO MainThread:3470051 [wandb_init.py:init():1057] run started, returning control to user process
22
+ 2025-09-08 06:56:44,862 INFO MainThread:3470051 [wandb_run.py:_config_callback():1380] config_cb None None {'_wandb': {'code_path': 'source-self-forcing-causvid_train_ode.py'}}
output/wandb/run-20250908_081933-xtabuxq1/files/config.yaml ADDED
@@ -0,0 +1,159 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.21.3
4
+ code_path: source-self-forcing-causvid_train_ode.py
5
+ e:
6
+ 0fh2pmjwzgt2no6kkv0vzcqewqutpwmq:
7
+ args:
8
+ - --config_path
9
+ - configs/wan_causal_ode.yaml
10
+ codePath: causvid/train_ode.py
11
+ codePathLocal: causvid/train_ode.py
12
+ cpu_count: 48
13
+ cpu_count_logical: 96
14
+ cudaVersion: "12.8"
15
+ disk:
16
+ /:
17
+ total: "2079114358784"
18
+ used: "1383118893056"
19
20
+ executable: /home/yitongli/miniconda3/envs/causvid/bin/python3.10
21
+ git:
22
+ commit: adb6a5ecd07666b4d0290042915c8406e6d5ce22
23
+ remote: https://github.com/tianweiy/CausVid.git
24
+ gpu: NVIDIA A100-SXM4-80GB
25
+ gpu_count: 8
26
+ gpu_nvidia:
27
+ - architecture: Ampere
28
+ cudaCores: 6912
29
+ memoryTotal: "85899345920"
30
+ name: NVIDIA A100-SXM4-80GB
31
+ uuid: GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949
32
+ - architecture: Ampere
33
+ cudaCores: 6912
34
+ memoryTotal: "85899345920"
35
+ name: NVIDIA A100-SXM4-80GB
36
+ uuid: GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42
37
+ - architecture: Ampere
38
+ cudaCores: 6912
39
+ memoryTotal: "85899345920"
40
+ name: NVIDIA A100-SXM4-80GB
41
+ uuid: GPU-1f47056a-9c2c-8af1-8232-636203622830
42
+ - architecture: Ampere
43
+ cudaCores: 6912
44
+ memoryTotal: "85899345920"
45
+ name: NVIDIA A100-SXM4-80GB
46
+ uuid: GPU-38de1dff-a680-ec66-625b-49f2a31e3b42
47
+ - architecture: Ampere
48
+ cudaCores: 6912
49
+ memoryTotal: "85899345920"
50
+ name: NVIDIA A100-SXM4-80GB
51
+ uuid: GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204
52
+ - architecture: Ampere
53
+ cudaCores: 6912
54
+ memoryTotal: "85899345920"
55
+ name: NVIDIA A100-SXM4-80GB
56
+ uuid: GPU-194ed489-5bfa-defc-85b1-812953e7d84a
57
+ - architecture: Ampere
58
+ cudaCores: 6912
59
+ memoryTotal: "85899345920"
60
+ name: NVIDIA A100-SXM4-80GB
61
+ uuid: GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4
62
+ - architecture: Ampere
63
+ cudaCores: 6912
64
+ memoryTotal: "85899345920"
65
+ name: NVIDIA A100-SXM4-80GB
66
+ uuid: GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057
67
+ host: ip-172-31-3-169
68
+ memory:
69
+ total: "1204521443328"
70
+ os: Linux-6.8.0-1028-aws-x86_64-with-glibc2.39
71
+ program: /home/yitongli/CausVid/causvid/train_ode.py
72
+ python: CPython 3.10.18
73
+ root: ./output
74
+ startedAt: "2025-09-08T08:19:33.312470Z"
75
+ writerId: 0fh2pmjwzgt2no6kkv0vzcqewqutpwmq
76
+ m: []
77
+ python_version: 3.10.18
78
+ t:
79
+ "1":
80
+ - 1
81
+ - 11
82
+ - 41
83
+ - 49
84
+ - 71
85
+ - 83
86
+ - 105
87
+ "2":
88
+ - 1
89
+ - 11
90
+ - 41
91
+ - 49
92
+ - 71
93
+ - 83
94
+ - 105
95
+ "3":
96
+ - 16
97
+ - 17
98
+ "4": 3.10.18
99
+ "5": 0.21.3
100
+ "6": 4.56.1
101
+ "12": 0.21.3
102
+ "13": linux-x86_64
103
+ batch_size:
104
+ value: 2
105
+ beta1:
106
+ value: 0.9
107
+ beta2:
108
+ value: 0.999
109
+ data_path:
110
+ value: ../mixkit_ode_lmdb
111
+ denoising_step_list:
112
+ value:
113
+ - 1000
114
+ - 757
115
+ - 522
116
+ - 0
117
+ distillation_loss:
118
+ value: ode
119
+ generator_fsdp_wrap_strategy:
120
+ value: size
121
+ generator_grad:
122
+ value:
123
+ model: true
124
+ generator_task:
125
+ value: causal_video
126
+ gradient_checkpointing:
127
+ value: true
128
+ log_iters:
129
+ value: 200
130
+ lr:
131
+ value: 2e-06
132
+ mixed_precision:
133
+ value: true
134
+ model_name:
135
+ value: causal_wan
136
+ no_save:
137
+ value: false
138
+ num_frame_per_block:
139
+ value: 3
140
+ output_path:
141
+ value: ./output
142
+ seed:
143
+ value: 4894427
144
+ sharding_strategy:
145
+ value: hybrid_full
146
+ text_encoder_fsdp_wrap_strategy:
147
+ value: size
148
+ wandb_entity:
149
+ value: liyitong-Tsinghua University
150
+ wandb_host:
151
+ value: https://api.wandb.ai
152
+ wandb_key:
153
+ value: 5409d3b960b01b25cec0f6abb5361b4022f0cc41
154
+ wandb_name:
155
+ value: wan_causal_ode
156
+ wandb_project:
157
+ value: self-forcing
158
+ warp_denoising_step:
159
+ value: false
output/wandb/run-20250908_081933-xtabuxq1/files/wandb-metadata.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1028-aws-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2025-09-08T08:19:33.312470Z",
5
+ "args": [
6
+ "--config_path",
7
+ "configs/wan_causal_ode.yaml"
8
+ ],
9
+ "program": "/home/yitongli/CausVid/causvid/train_ode.py",
10
+ "codePath": "causvid/train_ode.py",
11
+ "codePathLocal": "causvid/train_ode.py",
12
+ "git": {
13
+ "remote": "https://github.com/tianweiy/CausVid.git",
14
+ "commit": "adb6a5ecd07666b4d0290042915c8406e6d5ce22"
15
+ },
16
+ "email": "[email protected]",
17
+ "root": "./output",
18
+ "host": "ip-172-31-3-169",
19
+ "executable": "/home/yitongli/miniconda3/envs/causvid/bin/python3.10",
20
+ "cpu_count": 48,
21
+ "cpu_count_logical": 96,
22
+ "gpu": "NVIDIA A100-SXM4-80GB",
23
+ "gpu_count": 8,
24
+ "disk": {
25
+ "/": {
26
+ "total": "2079114358784",
27
+ "used": "1383118893056"
28
+ }
29
+ },
30
+ "memory": {
31
+ "total": "1204521443328"
32
+ },
33
+ "gpu_nvidia": [
34
+ {
35
+ "name": "NVIDIA A100-SXM4-80GB",
36
+ "memoryTotal": "85899345920",
37
+ "cudaCores": 6912,
38
+ "architecture": "Ampere",
39
+ "uuid": "GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949"
40
+ },
41
+ {
42
+ "name": "NVIDIA A100-SXM4-80GB",
43
+ "memoryTotal": "85899345920",
44
+ "cudaCores": 6912,
45
+ "architecture": "Ampere",
46
+ "uuid": "GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42"
47
+ },
48
+ {
49
+ "name": "NVIDIA A100-SXM4-80GB",
50
+ "memoryTotal": "85899345920",
51
+ "cudaCores": 6912,
52
+ "architecture": "Ampere",
53
+ "uuid": "GPU-1f47056a-9c2c-8af1-8232-636203622830"
54
+ },
55
+ {
56
+ "name": "NVIDIA A100-SXM4-80GB",
57
+ "memoryTotal": "85899345920",
58
+ "cudaCores": 6912,
59
+ "architecture": "Ampere",
60
+ "uuid": "GPU-38de1dff-a680-ec66-625b-49f2a31e3b42"
61
+ },
62
+ {
63
+ "name": "NVIDIA A100-SXM4-80GB",
64
+ "memoryTotal": "85899345920",
65
+ "cudaCores": 6912,
66
+ "architecture": "Ampere",
67
+ "uuid": "GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204"
68
+ },
69
+ {
70
+ "name": "NVIDIA A100-SXM4-80GB",
71
+ "memoryTotal": "85899345920",
72
+ "cudaCores": 6912,
73
+ "architecture": "Ampere",
74
+ "uuid": "GPU-194ed489-5bfa-defc-85b1-812953e7d84a"
75
+ },
76
+ {
77
+ "name": "NVIDIA A100-SXM4-80GB",
78
+ "memoryTotal": "85899345920",
79
+ "cudaCores": 6912,
80
+ "architecture": "Ampere",
81
+ "uuid": "GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4"
82
+ },
83
+ {
84
+ "name": "NVIDIA A100-SXM4-80GB",
85
+ "memoryTotal": "85899345920",
86
+ "cudaCores": 6912,
87
+ "architecture": "Ampere",
88
+ "uuid": "GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057"
89
+ }
90
+ ],
91
+ "cudaVersion": "12.8",
92
+ "writerId": "0fh2pmjwzgt2no6kkv0vzcqewqutpwmq"
93
+ }
output/wandb/run-20250908_081933-xtabuxq1/logs/debug-core.log ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T08:19:33.333709351Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpl2jclwy9/port-3826501.txt","pid":3826501,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2025-09-08T08:19:33.334301481Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3826501}
3
+ {"time":"2025-09-08T08:19:33.334288666Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3826501-3826821-56449121/socket","Net":"unix"}}
4
+ {"time":"2025-09-08T08:19:33.519765449Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2025-09-08T08:19:33.527245947Z","level":"INFO","msg":"handleInformInit: received","streamId":"xtabuxq1","id":"1(@)"}
6
+ {"time":"2025-09-08T08:19:33.72624599Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"xtabuxq1","id":"1(@)"}
7
+ {"time":"2025-09-08T08:21:14.249662492Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
+ {"time":"2025-09-08T08:21:14.249744829Z","level":"INFO","msg":"server is shutting down"}
9
+ {"time":"2025-09-08T08:21:14.249739693Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
10
+ {"time":"2025-09-08T08:21:14.249900377Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-3826501-3826821-56449121/socket","Net":"unix"}}
11
+ {"time":"2025-09-08T08:21:14.249928173Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
12
+ {"time":"2025-09-08T08:21:14.74398118Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
13
+ {"time":"2025-09-08T08:21:14.744024642Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
14
+ {"time":"2025-09-08T08:21:14.74403815Z","level":"INFO","msg":"server is closed"}
output/wandb/run-20250908_081933-xtabuxq1/logs/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_setup.py:_flush():81] Current SDK version is 0.21.3
2
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_setup.py:_flush():81] Configure stats pid to 3826501
3
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/.config/wandb/settings
4
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/CausVid/wandb/settings
5
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_init.py:setup_run_log_directory():686] Logging user logs to ./output/wandb/run-20250908_081933-xtabuxq1/logs/debug.log
7
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_init.py:setup_run_log_directory():687] Logging internal logs to ./output/wandb/run-20250908_081933-xtabuxq1/logs/debug-internal.log
8
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_init.py:init():813] calling init triggers
9
+ 2025-09-08 08:19:33,313 INFO MainThread:3826501 [wandb_init.py:init():818] wandb.init called with sweep_config: {}
10
+ config: {'model_name': 'causal_wan', 'generator_grad': {'model': True}, 'denoising_step_list': [1000, 757, 522, 0], 'generator_task': 'causal_video', 'generator_fsdp_wrap_strategy': 'size', 'text_encoder_fsdp_wrap_strategy': 'size', 'mixed_precision': True, 'seed': 4894427, 'wandb_host': 'https://api.wandb.ai', 'wandb_key': '5409d3b960b01b25cec0f6abb5361b4022f0cc41', 'wandb_entity': 'liyitong-Tsinghua University', 'wandb_project': 'self-forcing', 'wandb_name': 'wan_causal_ode', 'sharding_strategy': 'hybrid_full', 'lr': 2e-06, 'beta1': 0.9, 'beta2': 0.999, 'data_path': '../mixkit_ode_lmdb', 'batch_size': 2, 'log_iters': 200, 'output_path': './output', 'distillation_loss': 'ode', 'gradient_checkpointing': True, 'num_frame_per_block': 3, 'warp_denoising_step': False, 'no_save': False, '_wandb': {}}
11
+ 2025-09-08 08:19:33,314 INFO MainThread:3826501 [wandb_init.py:init():854] starting backend
12
+ 2025-09-08 08:19:33,519 INFO MainThread:3826501 [wandb_init.py:init():857] sending inform_init request
13
+ 2025-09-08 08:19:33,524 INFO MainThread:3826501 [wandb_init.py:init():865] backend started and connected
14
+ 2025-09-08 08:19:33,527 INFO MainThread:3826501 [wandb_init.py:init():936] updated telemetry
15
+ 2025-09-08 08:19:33,532 INFO MainThread:3826501 [wandb_init.py:init():960] communicating run to backend with 90.0 second timeout
16
+ 2025-09-08 08:19:33,885 INFO MainThread:3826501 [wandb_init.py:init():1011] starting run threads in backend
17
+ 2025-09-08 08:19:33,999 INFO MainThread:3826501 [wandb_run.py:_console_start():2494] atexit reg
18
+ 2025-09-08 08:19:33,999 INFO MainThread:3826501 [wandb_run.py:_redirect():2342] redirect: wrap_raw
19
+ 2025-09-08 08:19:33,999 INFO MainThread:3826501 [wandb_run.py:_redirect():2411] Wrapping output streams.
20
+ 2025-09-08 08:19:33,999 INFO MainThread:3826501 [wandb_run.py:_redirect():2434] Redirects installed.
21
+ 2025-09-08 08:19:34,001 INFO MainThread:3826501 [wandb_init.py:init():1057] run started, returning control to user process
22
+ 2025-09-08 08:19:35,140 INFO MainThread:3826501 [wandb_run.py:_config_callback():1380] config_cb None None {'_wandb': {'code_path': 'source-self-forcing-causvid_train_ode.py'}}
23
+ 2025-09-08 08:21:14,249 INFO wandb-AsyncioManager-main:3826501 [service_client.py:_forward_responses():84] Reached EOF.
24
+ 2025-09-08 08:21:14,250 INFO wandb-AsyncioManager-main:3826501 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
output/wandb/run-20250908_084516-b1cckt0e/logs/debug-core.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T08:45:16.764735165Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp2ihrl71u/port-3877754.txt","pid":3877754,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2025-09-08T08:45:16.76537437Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3877754}
3
+ {"time":"2025-09-08T08:45:16.765346611Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3877754-3878040-3730929431/socket","Net":"unix"}}
4
+ {"time":"2025-09-08T08:45:16.950019952Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2025-09-08T08:45:16.958321194Z","level":"INFO","msg":"handleInformInit: received","streamId":"b1cckt0e","id":"1(@)"}
6
+ {"time":"2025-09-08T08:45:17.166215832Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"b1cckt0e","id":"1(@)"}
7
+ {"time":"2025-09-08T08:48:41.404482127Z","level":"INFO","msg":"server: parent process exited, terminating service process"}
output/wandb/run-20250908_084949-b9yvqkt5/files/config.yaml ADDED
@@ -0,0 +1,160 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.21.3
4
+ code_path: source-self-forcing-causvid_train_ode.py
5
+ e:
6
+ ytk5y3nz1jsnyvdlk65guvab4uhpkdm4:
7
+ args:
8
+ - --config_path
9
+ - configs/wan_causal_ode.yaml
10
+ codePath: causvid/train_ode.py
11
+ codePathLocal: causvid/train_ode.py
12
+ cpu_count: 48
13
+ cpu_count_logical: 96
14
+ cudaVersion: "12.8"
15
+ disk:
16
+ /:
17
+ total: "2079114358784"
18
+ used: "1386641809408"
19
20
+ executable: /home/yitongli/miniconda3/envs/causvid/bin/python3.10
21
+ git:
22
+ commit: adb6a5ecd07666b4d0290042915c8406e6d5ce22
23
+ remote: https://github.com/tianweiy/CausVid.git
24
+ gpu: NVIDIA A100-SXM4-80GB
25
+ gpu_count: 8
26
+ gpu_nvidia:
27
+ - architecture: Ampere
28
+ cudaCores: 6912
29
+ memoryTotal: "85899345920"
30
+ name: NVIDIA A100-SXM4-80GB
31
+ uuid: GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949
32
+ - architecture: Ampere
33
+ cudaCores: 6912
34
+ memoryTotal: "85899345920"
35
+ name: NVIDIA A100-SXM4-80GB
36
+ uuid: GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42
37
+ - architecture: Ampere
38
+ cudaCores: 6912
39
+ memoryTotal: "85899345920"
40
+ name: NVIDIA A100-SXM4-80GB
41
+ uuid: GPU-1f47056a-9c2c-8af1-8232-636203622830
42
+ - architecture: Ampere
43
+ cudaCores: 6912
44
+ memoryTotal: "85899345920"
45
+ name: NVIDIA A100-SXM4-80GB
46
+ uuid: GPU-38de1dff-a680-ec66-625b-49f2a31e3b42
47
+ - architecture: Ampere
48
+ cudaCores: 6912
49
+ memoryTotal: "85899345920"
50
+ name: NVIDIA A100-SXM4-80GB
51
+ uuid: GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204
52
+ - architecture: Ampere
53
+ cudaCores: 6912
54
+ memoryTotal: "85899345920"
55
+ name: NVIDIA A100-SXM4-80GB
56
+ uuid: GPU-194ed489-5bfa-defc-85b1-812953e7d84a
57
+ - architecture: Ampere
58
+ cudaCores: 6912
59
+ memoryTotal: "85899345920"
60
+ name: NVIDIA A100-SXM4-80GB
61
+ uuid: GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4
62
+ - architecture: Ampere
63
+ cudaCores: 6912
64
+ memoryTotal: "85899345920"
65
+ name: NVIDIA A100-SXM4-80GB
66
+ uuid: GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057
67
+ host: ip-172-31-3-169
68
+ memory:
69
+ total: "1204521443328"
70
+ os: Linux-6.8.0-1028-aws-x86_64-with-glibc2.39
71
+ program: /home/yitongli/CausVid/causvid/train_ode.py
72
+ python: CPython 3.10.18
73
+ root: ./output
74
+ startedAt: "2025-09-08T08:49:49.541042Z"
75
+ writerId: ytk5y3nz1jsnyvdlk65guvab4uhpkdm4
76
+ m: []
77
+ python_version: 3.10.18
78
+ t:
79
+ "1":
80
+ - 1
81
+ - 11
82
+ - 41
83
+ - 49
84
+ - 71
85
+ - 83
86
+ - 105
87
+ "2":
88
+ - 1
89
+ - 11
90
+ - 41
91
+ - 49
92
+ - 71
93
+ - 83
94
+ - 105
95
+ "3":
96
+ - 16
97
+ - 17
98
+ - 61
99
+ "4": 3.10.18
100
+ "5": 0.21.3
101
+ "6": 4.56.1
102
+ "12": 0.21.3
103
+ "13": linux-x86_64
104
+ batch_size:
105
+ value: 2
106
+ beta1:
107
+ value: 0.9
108
+ beta2:
109
+ value: 0.999
110
+ data_path:
111
+ value: ../mixkit_ode_lmdb
112
+ denoising_step_list:
113
+ value:
114
+ - 1000
115
+ - 757
116
+ - 522
117
+ - 0
118
+ distillation_loss:
119
+ value: ode
120
+ generator_fsdp_wrap_strategy:
121
+ value: size
122
+ generator_grad:
123
+ value:
124
+ model: true
125
+ generator_task:
126
+ value: causal_video
127
+ gradient_checkpointing:
128
+ value: true
129
+ log_iters:
130
+ value: 200
131
+ lr:
132
+ value: 2e-06
133
+ mixed_precision:
134
+ value: true
135
+ model_name:
136
+ value: causal_wan
137
+ no_save:
138
+ value: false
139
+ num_frame_per_block:
140
+ value: 3
141
+ output_path:
142
+ value: ./output
143
+ seed:
144
+ value: 2913400
145
+ sharding_strategy:
146
+ value: hybrid_full
147
+ text_encoder_fsdp_wrap_strategy:
148
+ value: size
149
+ wandb_entity:
150
+ value: liyitong-Tsinghua University
151
+ wandb_host:
152
+ value: https://api.wandb.ai
153
+ wandb_key:
154
+ value: 5409d3b960b01b25cec0f6abb5361b4022f0cc41
155
+ wandb_name:
156
+ value: wan_causal_ode
157
+ wandb_project:
158
+ value: self-forcing
159
+ warp_denoising_step:
160
+ value: false
output/wandb/run-20250908_084949-b9yvqkt5/files/output.log ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run dir: ./output/wandb/run-20250908_084949-b9yvqkt5/files
2
+ KV inference with 3 frames per block
3
+ ODERegression initialized.
4
+ cache a block wise causal mask with block size of 3 frames
5
+ BlockMask(shape=(1, 1, 32768, 32768), sparsity=42.52%,
6
+ (0, 0)
7
+ ████░░
8
+ ████░░
9
+ ████░░░░░░░░
10
+ ██████████░░
11
+ ██████████░░
12
+ ██████████░░░░░░░░
13
+ ████████████████░░
14
+ ████████████████░░
15
+ ████████████████░░░░░░░░
16
+ ██████████████████████░░
17
+ ██████████████████████░░
18
+ ██████████████████████░░░░░░░░
19
+ ████████████████████████████░░
20
+ ████████████████████████████░░
21
+ ████████████████████████████████░░
22
+ ████████████████████████████████░░
23
+ ████████████████████████████████░░░░░░░░
24
+ ████████████████████████████████████████
25
+ ████████████████████████████████████████
26
+ ████████████████████████████████████████
27
+ )
28
+ arrive
29
+ Start gathering distributed model states...
30
+ /home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc: https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial: https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html .
31
+ warnings.warn(
32
+ Model saved to ./output/2025-09-08-08-49-49.305637_seed2913400/checkpoint_model_000000/model.pt
33
+ training step 0...
34
+ ########### torch.Size([1, 21, 16, 60, 104])
35
+ Traceback (most recent call last):
36
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 229, in <module>
37
+ main()
38
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 223, in main
39
+ trainer.train()
40
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 187, in train
41
+ self.generate_video()
42
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 181, in generate_video
43
+ self.distillation_model.generate_video(ode_latent, conditional_dict)
44
+ File "/home/yitongli/CausVid/causvid/ode_regression.py", line 199, in generate_video
45
+ video = self.inference_pipeline.inference(
46
+ File "/home/yitongli/CausVid/causvid/models/wan/causal_inference.py", line 222, in inference
47
+ video = self.vae.decode_to_pixel(output)
48
+ File "/home/yitongli/CausVid/causvid/models/wan/wan_wrapper.py", line 83, in decode_to_pixel
49
+ output = [
50
+ File "/home/yitongli/CausVid/causvid/models/wan/wan_wrapper.py", line 84, in <listcomp>
51
+ self.model.decode(u.unsqueeze(0),
52
+ File "/home/yitongli/CausVid/causvid/models/wan/wan_base/modules/vae.py", line 553, in decode
53
+ x = self.conv2(z)
54
+ File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl
55
+ return self._call_impl(*args, **kwargs)
56
+ File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl
57
+ return forward_call(*args, **kwargs)
58
+ File "/home/yitongli/CausVid/causvid/models/wan/wan_base/modules/vae.py", line 36, in forward
59
+ return super().forward(x)
60
+ File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/nn/modules/conv.py", line 717, in forward
61
+ return self._conv_forward(input, self.weight, self.bias)
62
+ File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/nn/modules/conv.py", line 712, in _conv_forward
63
+ return F.conv3d(
64
+ RuntimeError: Input type (c10::BFloat16) and bias type (float) should be the same
65
+ [rank0]: Traceback (most recent call last):
66
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 229, in <module>
67
+ [rank0]: main()
68
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 223, in main
69
+ [rank0]: trainer.train()
70
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 187, in train
71
+ [rank0]: self.generate_video()
72
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 181, in generate_video
73
+ [rank0]: self.distillation_model.generate_video(ode_latent, conditional_dict)
74
+ [rank0]: File "/home/yitongli/CausVid/causvid/ode_regression.py", line 199, in generate_video
75
+ [rank0]: video = self.inference_pipeline.inference(
76
+ [rank0]: File "/home/yitongli/CausVid/causvid/models/wan/causal_inference.py", line 222, in inference
77
+ [rank0]: video = self.vae.decode_to_pixel(output)
78
+ [rank0]: File "/home/yitongli/CausVid/causvid/models/wan/wan_wrapper.py", line 83, in decode_to_pixel
79
+ [rank0]: output = [
80
+ [rank0]: File "/home/yitongli/CausVid/causvid/models/wan/wan_wrapper.py", line 84, in <listcomp>
81
+ [rank0]: self.model.decode(u.unsqueeze(0),
82
+ [rank0]: File "/home/yitongli/CausVid/causvid/models/wan/wan_base/modules/vae.py", line 553, in decode
83
+ [rank0]: x = self.conv2(z)
84
+ [rank0]: File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl
85
+ [rank0]: return self._call_impl(*args, **kwargs)
86
+ [rank0]: File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl
87
+ [rank0]: return forward_call(*args, **kwargs)
88
+ [rank0]: File "/home/yitongli/CausVid/causvid/models/wan/wan_base/modules/vae.py", line 36, in forward
89
+ [rank0]: return super().forward(x)
90
+ [rank0]: File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/nn/modules/conv.py", line 717, in forward
91
+ [rank0]: return self._conv_forward(input, self.weight, self.bias)
92
+ [rank0]: File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/nn/modules/conv.py", line 712, in _conv_forward
93
+ [rank0]: return F.conv3d(
94
+ [rank0]: RuntimeError: Input type (c10::BFloat16) and bias type (float) should be the same
output/wandb/run-20250908_084949-b9yvqkt5/files/requirements.txt ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ nvidia-cuda-nvrtc-cu12==12.8.93
2
+ filelock==3.19.1
3
+ aiofiles==24.1.0
4
+ PyYAML==6.0.2
5
+ httpx==0.28.1
6
+ multidict==6.6.4
7
+ tifffile==2025.5.10
8
+ tzdata==2025.2
9
+ urllib3==2.5.0
10
+ decord==0.6.0
11
+ certifi==2025.8.3
12
+ setuptools==78.1.1
13
+ websocket-client==1.8.0
14
+ gitdb==4.0.12
15
+ yarl==1.20.1
16
+ tqdm==4.67.1
17
+ open_clip_torch==3.1.0
18
+ pyparsing==3.2.3
19
+ fastapi==0.116.1
20
+ nvidia-curand-cu12==10.3.9.90
21
+ mdurl==0.1.2
22
+ torchvision==0.23.0
23
+ h11==0.16.0
24
+ pytz==2025.2
25
+ six==1.17.0
26
+ nvidia-cufile-cu12==1.13.1.3
27
+ aiohappyeyeballs==2.6.1
28
+ wandb==0.21.3
29
+ nvidia-nvjitlink-cu12==12.8.93
30
+ cycler==0.12.1
31
+ anyio==4.10.0
32
+ scikit-image==0.25.2
33
+ nvidia-cuda-runtime-cu12==12.8.90
34
+ sentencepiece==0.2.1
35
+ rich==14.1.0
36
+ pydantic==2.11.7
37
+ GitPython==3.1.45
38
+ python-dateutil==2.9.0.post0
39
+ accelerate==1.10.1
40
+ proglog==0.1.12
41
+ sentry-sdk==2.37.0
42
+ nvidia-cusparselt-cu12==0.7.1
43
+ dashscope==1.24.3
44
+ platformdirs==4.4.0
45
+ safehttpx==0.1.6
46
+ fsspec==2025.9.0
47
+ lazy_loader==0.4
48
+ typing_extensions==4.15.0
49
+ semantic-version==2.10.0
50
+ numpy==1.24.4
51
+ nvidia-cufft-cu12==11.3.3.83
52
+ ruff==0.12.12
53
+ nvidia-cudnn-cu12==9.10.2.21
54
+ annotated-types==0.7.0
55
+ decorator==4.4.2
56
+ antlr4-python3-runtime==4.9.3
57
+ psutil==7.0.0
58
+ Brotli==1.1.0
59
+ tomlkit==0.13.3
60
+ httpcore==1.0.9
61
+ kiwisolver==1.4.9
62
+ nvidia-cusparse-cu12==12.5.8.93
63
+ groovy==0.1.2
64
+ protobuf==6.32.0
65
+ orjson==3.11.3
66
+ scipy==1.15.3
67
+ regex==2025.9.1
68
+ MarkupSafe==3.0.2
69
+ av==13.1.0
70
+ timm==1.0.19
71
+ uvicorn==0.35.0
72
+ wheel==0.45.1
73
+ Pygments==2.19.2
74
+ websockets==15.0.1
75
+ lmdb==1.7.3
76
+ sympy==1.14.0
77
+ einops==0.8.1
78
+ idna==3.10
79
+ triton==3.4.0
80
+ torch==2.8.0
81
+ moviepy==1.0.3
82
+ nvidia-nvtx-cu12==12.8.90
83
+ matplotlib==3.10.6
84
+ pillow==11.3.0
85
+ charset-normalizer==3.4.3
86
+ attrs==25.3.0
87
+ aiosignal==1.4.0
88
+ markdown-it-py==4.0.0
89
+ requests==2.32.5
90
+ typer==0.17.4
91
+ huggingface-hub==0.34.4
92
+ nvidia-nccl-cu12==2.27.3
93
+ propcache==0.3.2
94
+ opencv-python==4.11.0.86
95
+ ffmpy==0.6.1
96
+ jmespath==1.0.1
97
+ botocore==1.40.25
98
+ pydantic_core==2.33.2
99
+ fonttools==4.59.2
100
+ omegaconf==2.3.0
101
+ pycparser==2.22
102
+ mpmath==1.3.0
103
+ flash_attn==2.8.3
104
+ smmap==5.0.2
105
+ gradio_client==1.12.1
106
+ exceptiongroup==1.3.0
107
+ cffi==1.17.1
108
+ diffusers==0.31.0
109
+ nvidia-cusolver-cu12==11.7.3.90
110
+ contourpy==1.3.2
111
+ cryptography==45.0.7
112
+ nvidia-cuda-cupti-cu12==12.8.90
113
+ wcwidth==0.2.13
114
+ zipp==3.23.0
115
+ safetensors==0.6.2
116
+ gradio==5.44.1
117
+ click==8.2.1
118
+ frozenlist==1.7.0
119
+ networkx==3.4.2
120
+ s3transfer==0.13.1
121
+ shellingham==1.5.4
122
+ starlette==0.47.3
123
+ packaging==25.0
124
+ ftfy==6.3.1
125
+ importlib_metadata==8.7.0
126
+ transformers==4.56.1
127
+ nvidia-cublas-cu12==12.8.4.1
128
+ Jinja2==3.1.6
129
+ pycocotools==2.0.10
130
+ sniffio==1.3.1
131
+ hf-xet==1.1.9
132
+ typing-inspection==0.4.1
133
+ pandas==2.3.2
134
+ python-multipart==0.0.20
135
+ aiohttp==3.12.15
136
+ clip==1.0
137
+ pydub==0.25.1
138
+ easydict==1.13
139
+ pip==25.2
140
+ tokenizers==0.22.0
141
+ imageio==2.37.0
142
+ async-timeout==5.0.1
143
+ boto3==1.40.25
144
+ imageio-ffmpeg==0.6.0
145
+ CausVid==0.0.1
output/wandb/run-20250908_084949-b9yvqkt5/files/wandb-metadata.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1028-aws-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2025-09-08T08:49:49.541042Z",
5
+ "args": [
6
+ "--config_path",
7
+ "configs/wan_causal_ode.yaml"
8
+ ],
9
+ "program": "/home/yitongli/CausVid/causvid/train_ode.py",
10
+ "codePath": "causvid/train_ode.py",
11
+ "codePathLocal": "causvid/train_ode.py",
12
+ "git": {
13
+ "remote": "https://github.com/tianweiy/CausVid.git",
14
+ "commit": "adb6a5ecd07666b4d0290042915c8406e6d5ce22"
15
+ },
16
+ "email": "[email protected]",
17
+ "root": "./output",
18
+ "host": "ip-172-31-3-169",
19
+ "executable": "/home/yitongli/miniconda3/envs/causvid/bin/python3.10",
20
+ "cpu_count": 48,
21
+ "cpu_count_logical": 96,
22
+ "gpu": "NVIDIA A100-SXM4-80GB",
23
+ "gpu_count": 8,
24
+ "disk": {
25
+ "/": {
26
+ "total": "2079114358784",
27
+ "used": "1386641809408"
28
+ }
29
+ },
30
+ "memory": {
31
+ "total": "1204521443328"
32
+ },
33
+ "gpu_nvidia": [
34
+ {
35
+ "name": "NVIDIA A100-SXM4-80GB",
36
+ "memoryTotal": "85899345920",
37
+ "cudaCores": 6912,
38
+ "architecture": "Ampere",
39
+ "uuid": "GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949"
40
+ },
41
+ {
42
+ "name": "NVIDIA A100-SXM4-80GB",
43
+ "memoryTotal": "85899345920",
44
+ "cudaCores": 6912,
45
+ "architecture": "Ampere",
46
+ "uuid": "GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42"
47
+ },
48
+ {
49
+ "name": "NVIDIA A100-SXM4-80GB",
50
+ "memoryTotal": "85899345920",
51
+ "cudaCores": 6912,
52
+ "architecture": "Ampere",
53
+ "uuid": "GPU-1f47056a-9c2c-8af1-8232-636203622830"
54
+ },
55
+ {
56
+ "name": "NVIDIA A100-SXM4-80GB",
57
+ "memoryTotal": "85899345920",
58
+ "cudaCores": 6912,
59
+ "architecture": "Ampere",
60
+ "uuid": "GPU-38de1dff-a680-ec66-625b-49f2a31e3b42"
61
+ },
62
+ {
63
+ "name": "NVIDIA A100-SXM4-80GB",
64
+ "memoryTotal": "85899345920",
65
+ "cudaCores": 6912,
66
+ "architecture": "Ampere",
67
+ "uuid": "GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204"
68
+ },
69
+ {
70
+ "name": "NVIDIA A100-SXM4-80GB",
71
+ "memoryTotal": "85899345920",
72
+ "cudaCores": 6912,
73
+ "architecture": "Ampere",
74
+ "uuid": "GPU-194ed489-5bfa-defc-85b1-812953e7d84a"
75
+ },
76
+ {
77
+ "name": "NVIDIA A100-SXM4-80GB",
78
+ "memoryTotal": "85899345920",
79
+ "cudaCores": 6912,
80
+ "architecture": "Ampere",
81
+ "uuid": "GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4"
82
+ },
83
+ {
84
+ "name": "NVIDIA A100-SXM4-80GB",
85
+ "memoryTotal": "85899345920",
86
+ "cudaCores": 6912,
87
+ "architecture": "Ampere",
88
+ "uuid": "GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057"
89
+ }
90
+ ],
91
+ "cudaVersion": "12.8",
92
+ "writerId": "ytk5y3nz1jsnyvdlk65guvab4uhpkdm4"
93
+ }
output/wandb/run-20250908_084949-b9yvqkt5/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_wandb":{"runtime":134},"_runtime":134.067707153,"generator_loss":0.020751953125,"generator_grad_norm":5.278256416320801,"loss_at_time_250":0.016326904296875,"_timestamp":1.7573215036196253e+09,"_step":0}
output/wandb/run-20250908_084949-b9yvqkt5/logs/debug-core.log ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T08:49:49.562614129Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpr7mbm8le/port-3899796.txt","pid":3899796,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2025-09-08T08:49:49.563183638Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3899796-3900061-1880589413/socket","Net":"unix"}}
3
+ {"time":"2025-09-08T08:49:49.563187036Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3899796}
4
+ {"time":"2025-09-08T08:49:49.748718746Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2025-09-08T08:49:49.756209089Z","level":"INFO","msg":"handleInformInit: received","streamId":"b9yvqkt5","id":"1(@)"}
6
+ {"time":"2025-09-08T08:49:49.964234191Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"b9yvqkt5","id":"1(@)"}
7
+ {"time":"2025-09-08T08:52:04.255668903Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
+ {"time":"2025-09-08T08:52:04.255755182Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
9
+ {"time":"2025-09-08T08:52:04.255795637Z","level":"INFO","msg":"server is shutting down"}
10
+ {"time":"2025-09-08T08:52:04.256573202Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
11
+ {"time":"2025-09-08T08:52:04.263624933Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-3899796-3900061-1880589413/socket","Net":"unix"}}
12
+ {"time":"2025-09-08T08:52:04.76114449Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
13
+ {"time":"2025-09-08T08:52:04.761165019Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
14
+ {"time":"2025-09-08T08:52:04.761174679Z","level":"INFO","msg":"server is closed"}
output/wandb/run-20250908_084949-b9yvqkt5/logs/debug-internal.log ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T08:49:49.756354218Z","level":"INFO","msg":"stream: starting","core version":"0.21.3"}
2
+ {"time":"2025-09-08T08:49:49.964190017Z","level":"INFO","msg":"stream: created new stream","id":"b9yvqkt5"}
3
+ {"time":"2025-09-08T08:49:49.964229664Z","level":"INFO","msg":"stream: started","id":"b9yvqkt5"}
4
+ {"time":"2025-09-08T08:49:49.964243758Z","level":"INFO","msg":"writer: started","stream_id":"b9yvqkt5"}
5
+ {"time":"2025-09-08T08:49:49.964270263Z","level":"INFO","msg":"handler: started","stream_id":"b9yvqkt5"}
6
+ {"time":"2025-09-08T08:49:49.964261355Z","level":"INFO","msg":"sender: started","stream_id":"b9yvqkt5"}
7
+ {"time":"2025-09-08T08:52:04.25574272Z","level":"INFO","msg":"stream: closing","id":"b9yvqkt5"}
8
+ {"time":"2025-09-08T08:52:04.575873408Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
9
+ {"time":"2025-09-08T08:52:04.755032763Z","level":"INFO","msg":"handler: closed","stream_id":"b9yvqkt5"}
10
+ {"time":"2025-09-08T08:52:04.755112443Z","level":"INFO","msg":"sender: closed","stream_id":"b9yvqkt5"}
11
+ {"time":"2025-09-08T08:52:04.755121083Z","level":"INFO","msg":"stream: closed","id":"b9yvqkt5"}
output/wandb/run-20250908_084949-b9yvqkt5/logs/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_setup.py:_flush():81] Current SDK version is 0.21.3
2
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_setup.py:_flush():81] Configure stats pid to 3899796
3
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/.config/wandb/settings
4
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/CausVid/wandb/settings
5
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_init.py:setup_run_log_directory():686] Logging user logs to ./output/wandb/run-20250908_084949-b9yvqkt5/logs/debug.log
7
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_init.py:setup_run_log_directory():687] Logging internal logs to ./output/wandb/run-20250908_084949-b9yvqkt5/logs/debug-internal.log
8
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_init.py:init():813] calling init triggers
9
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_init.py:init():818] wandb.init called with sweep_config: {}
10
+ config: {'model_name': 'causal_wan', 'generator_grad': {'model': True}, 'denoising_step_list': [1000, 757, 522, 0], 'generator_task': 'causal_video', 'generator_fsdp_wrap_strategy': 'size', 'text_encoder_fsdp_wrap_strategy': 'size', 'mixed_precision': True, 'seed': 2913400, 'wandb_host': 'https://api.wandb.ai', 'wandb_key': '5409d3b960b01b25cec0f6abb5361b4022f0cc41', 'wandb_entity': 'liyitong-Tsinghua University', 'wandb_project': 'self-forcing', 'wandb_name': 'wan_causal_ode', 'sharding_strategy': 'hybrid_full', 'lr': 2e-06, 'beta1': 0.9, 'beta2': 0.999, 'data_path': '../mixkit_ode_lmdb', 'batch_size': 2, 'log_iters': 200, 'output_path': './output', 'distillation_loss': 'ode', 'gradient_checkpointing': True, 'num_frame_per_block': 3, 'warp_denoising_step': False, 'no_save': False, '_wandb': {}}
11
+ 2025-09-08 08:49:49,542 INFO MainThread:3899796 [wandb_init.py:init():854] starting backend
12
+ 2025-09-08 08:49:49,748 INFO MainThread:3899796 [wandb_init.py:init():857] sending inform_init request
13
+ 2025-09-08 08:49:49,752 INFO MainThread:3899796 [wandb_init.py:init():865] backend started and connected
14
+ 2025-09-08 08:49:49,754 INFO MainThread:3899796 [wandb_init.py:init():936] updated telemetry
15
+ 2025-09-08 08:49:49,759 INFO MainThread:3899796 [wandb_init.py:init():960] communicating run to backend with 90.0 second timeout
16
+ 2025-09-08 08:49:50,186 INFO MainThread:3899796 [wandb_init.py:init():1011] starting run threads in backend
17
+ 2025-09-08 08:49:50,300 INFO MainThread:3899796 [wandb_run.py:_console_start():2494] atexit reg
18
+ 2025-09-08 08:49:50,300 INFO MainThread:3899796 [wandb_run.py:_redirect():2342] redirect: wrap_raw
19
+ 2025-09-08 08:49:50,300 INFO MainThread:3899796 [wandb_run.py:_redirect():2411] Wrapping output streams.
20
+ 2025-09-08 08:49:50,301 INFO MainThread:3899796 [wandb_run.py:_redirect():2434] Redirects installed.
21
+ 2025-09-08 08:49:50,303 INFO MainThread:3899796 [wandb_init.py:init():1057] run started, returning control to user process
22
+ 2025-09-08 08:49:50,698 INFO MainThread:3899796 [wandb_run.py:_config_callback():1380] config_cb None None {'_wandb': {'code_path': 'source-self-forcing-causvid_train_ode.py'}}
23
+ 2025-09-08 08:52:04,255 INFO wandb-AsyncioManager-main:3899796 [service_client.py:_forward_responses():84] Reached EOF.
24
+ 2025-09-08 08:52:04,255 INFO wandb-AsyncioManager-main:3899796 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
output/wandb/run-20250908_084949-b9yvqkt5/run-b9yvqkt5.wandb ADDED
Binary file (42.6 kB). View file
 
output/wandb/run-20250908_085656-y8q57cbx/files/output.log ADDED
@@ -0,0 +1 @@
 
 
1
+ run dir: ./output/wandb/run-20250908_085656-y8q57cbx/files
output/wandb/run-20250908_085656-y8q57cbx/files/requirements.txt ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ nvidia-cuda-nvrtc-cu12==12.8.93
2
+ filelock==3.19.1
3
+ aiofiles==24.1.0
4
+ PyYAML==6.0.2
5
+ httpx==0.28.1
6
+ multidict==6.6.4
7
+ tifffile==2025.5.10
8
+ tzdata==2025.2
9
+ urllib3==2.5.0
10
+ decord==0.6.0
11
+ certifi==2025.8.3
12
+ setuptools==78.1.1
13
+ websocket-client==1.8.0
14
+ gitdb==4.0.12
15
+ yarl==1.20.1
16
+ tqdm==4.67.1
17
+ open_clip_torch==3.1.0
18
+ pyparsing==3.2.3
19
+ fastapi==0.116.1
20
+ nvidia-curand-cu12==10.3.9.90
21
+ mdurl==0.1.2
22
+ torchvision==0.23.0
23
+ h11==0.16.0
24
+ pytz==2025.2
25
+ six==1.17.0
26
+ nvidia-cufile-cu12==1.13.1.3
27
+ aiohappyeyeballs==2.6.1
28
+ wandb==0.21.3
29
+ nvidia-nvjitlink-cu12==12.8.93
30
+ cycler==0.12.1
31
+ anyio==4.10.0
32
+ scikit-image==0.25.2
33
+ nvidia-cuda-runtime-cu12==12.8.90
34
+ sentencepiece==0.2.1
35
+ rich==14.1.0
36
+ pydantic==2.11.7
37
+ GitPython==3.1.45
38
+ python-dateutil==2.9.0.post0
39
+ accelerate==1.10.1
40
+ proglog==0.1.12
41
+ sentry-sdk==2.37.0
42
+ nvidia-cusparselt-cu12==0.7.1
43
+ dashscope==1.24.3
44
+ platformdirs==4.4.0
45
+ safehttpx==0.1.6
46
+ fsspec==2025.9.0
47
+ lazy_loader==0.4
48
+ typing_extensions==4.15.0
49
+ semantic-version==2.10.0
50
+ numpy==1.24.4
51
+ nvidia-cufft-cu12==11.3.3.83
52
+ ruff==0.12.12
53
+ nvidia-cudnn-cu12==9.10.2.21
54
+ annotated-types==0.7.0
55
+ decorator==4.4.2
56
+ antlr4-python3-runtime==4.9.3
57
+ psutil==7.0.0
58
+ Brotli==1.1.0
59
+ tomlkit==0.13.3
60
+ httpcore==1.0.9
61
+ kiwisolver==1.4.9
62
+ nvidia-cusparse-cu12==12.5.8.93
63
+ groovy==0.1.2
64
+ protobuf==6.32.0
65
+ orjson==3.11.3
66
+ scipy==1.15.3
67
+ regex==2025.9.1
68
+ MarkupSafe==3.0.2
69
+ av==13.1.0
70
+ timm==1.0.19
71
+ uvicorn==0.35.0
72
+ wheel==0.45.1
73
+ Pygments==2.19.2
74
+ websockets==15.0.1
75
+ lmdb==1.7.3
76
+ sympy==1.14.0
77
+ einops==0.8.1
78
+ idna==3.10
79
+ triton==3.4.0
80
+ torch==2.8.0
81
+ moviepy==1.0.3
82
+ nvidia-nvtx-cu12==12.8.90
83
+ matplotlib==3.10.6
84
+ pillow==11.3.0
85
+ charset-normalizer==3.4.3
86
+ attrs==25.3.0
87
+ aiosignal==1.4.0
88
+ markdown-it-py==4.0.0
89
+ requests==2.32.5
90
+ typer==0.17.4
91
+ huggingface-hub==0.34.4
92
+ nvidia-nccl-cu12==2.27.3
93
+ propcache==0.3.2
94
+ opencv-python==4.11.0.86
95
+ ffmpy==0.6.1
96
+ jmespath==1.0.1
97
+ botocore==1.40.25
98
+ pydantic_core==2.33.2
99
+ fonttools==4.59.2
100
+ omegaconf==2.3.0
101
+ pycparser==2.22
102
+ mpmath==1.3.0
103
+ flash_attn==2.8.3
104
+ smmap==5.0.2
105
+ gradio_client==1.12.1
106
+ exceptiongroup==1.3.0
107
+ cffi==1.17.1
108
+ diffusers==0.31.0
109
+ nvidia-cusolver-cu12==11.7.3.90
110
+ contourpy==1.3.2
111
+ cryptography==45.0.7
112
+ nvidia-cuda-cupti-cu12==12.8.90
113
+ wcwidth==0.2.13
114
+ zipp==3.23.0
115
+ safetensors==0.6.2
116
+ gradio==5.44.1
117
+ click==8.2.1
118
+ frozenlist==1.7.0
119
+ networkx==3.4.2
120
+ s3transfer==0.13.1
121
+ shellingham==1.5.4
122
+ starlette==0.47.3
123
+ packaging==25.0
124
+ ftfy==6.3.1
125
+ importlib_metadata==8.7.0
126
+ transformers==4.56.1
127
+ nvidia-cublas-cu12==12.8.4.1
128
+ Jinja2==3.1.6
129
+ pycocotools==2.0.10
130
+ sniffio==1.3.1
131
+ hf-xet==1.1.9
132
+ typing-inspection==0.4.1
133
+ pandas==2.3.2
134
+ python-multipart==0.0.20
135
+ aiohttp==3.12.15
136
+ clip==1.0
137
+ pydub==0.25.1
138
+ easydict==1.13
139
+ pip==25.2
140
+ tokenizers==0.22.0
141
+ imageio==2.37.0
142
+ async-timeout==5.0.1
143
+ boto3==1.40.25
144
+ imageio-ffmpeg==0.6.0
145
+ CausVid==0.0.1
output/wandb/run-20250908_085656-y8q57cbx/files/wandb-metadata.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1028-aws-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2025-09-08T08:56:56.977649Z",
5
+ "args": [
6
+ "--config_path",
7
+ "configs/wan_causal_ode.yaml"
8
+ ],
9
+ "program": "/home/yitongli/CausVid/causvid/train_ode.py",
10
+ "codePath": "causvid/train_ode.py",
11
+ "codePathLocal": "causvid/train_ode.py",
12
+ "git": {
13
+ "remote": "https://github.com/tianweiy/CausVid.git",
14
+ "commit": "adb6a5ecd07666b4d0290042915c8406e6d5ce22"
15
+ },
16
+ "email": "[email protected]",
17
+ "root": "./output",
18
+ "host": "ip-172-31-3-169",
19
+ "executable": "/home/yitongli/miniconda3/envs/causvid/bin/python3.10",
20
+ "cpu_count": 48,
21
+ "cpu_count_logical": 96,
22
+ "gpu": "NVIDIA A100-SXM4-80GB",
23
+ "gpu_count": 8,
24
+ "disk": {
25
+ "/": {
26
+ "total": "2079114358784",
27
+ "used": "1396408811520"
28
+ }
29
+ },
30
+ "memory": {
31
+ "total": "1204521443328"
32
+ },
33
+ "gpu_nvidia": [
34
+ {
35
+ "name": "NVIDIA A100-SXM4-80GB",
36
+ "memoryTotal": "85899345920",
37
+ "cudaCores": 6912,
38
+ "architecture": "Ampere",
39
+ "uuid": "GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949"
40
+ },
41
+ {
42
+ "name": "NVIDIA A100-SXM4-80GB",
43
+ "memoryTotal": "85899345920",
44
+ "cudaCores": 6912,
45
+ "architecture": "Ampere",
46
+ "uuid": "GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42"
47
+ },
48
+ {
49
+ "name": "NVIDIA A100-SXM4-80GB",
50
+ "memoryTotal": "85899345920",
51
+ "cudaCores": 6912,
52
+ "architecture": "Ampere",
53
+ "uuid": "GPU-1f47056a-9c2c-8af1-8232-636203622830"
54
+ },
55
+ {
56
+ "name": "NVIDIA A100-SXM4-80GB",
57
+ "memoryTotal": "85899345920",
58
+ "cudaCores": 6912,
59
+ "architecture": "Ampere",
60
+ "uuid": "GPU-38de1dff-a680-ec66-625b-49f2a31e3b42"
61
+ },
62
+ {
63
+ "name": "NVIDIA A100-SXM4-80GB",
64
+ "memoryTotal": "85899345920",
65
+ "cudaCores": 6912,
66
+ "architecture": "Ampere",
67
+ "uuid": "GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204"
68
+ },
69
+ {
70
+ "name": "NVIDIA A100-SXM4-80GB",
71
+ "memoryTotal": "85899345920",
72
+ "cudaCores": 6912,
73
+ "architecture": "Ampere",
74
+ "uuid": "GPU-194ed489-5bfa-defc-85b1-812953e7d84a"
75
+ },
76
+ {
77
+ "name": "NVIDIA A100-SXM4-80GB",
78
+ "memoryTotal": "85899345920",
79
+ "cudaCores": 6912,
80
+ "architecture": "Ampere",
81
+ "uuid": "GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4"
82
+ },
83
+ {
84
+ "name": "NVIDIA A100-SXM4-80GB",
85
+ "memoryTotal": "85899345920",
86
+ "cudaCores": 6912,
87
+ "architecture": "Ampere",
88
+ "uuid": "GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057"
89
+ }
90
+ ],
91
+ "cudaVersion": "12.8",
92
+ "writerId": "j1na06z1wvv9hx6dftanb741hwvst9hr"
93
+ }
output/wandb/run-20250908_085656-y8q57cbx/run-y8q57cbx.wandb ADDED
File without changes
output/wandb/run-20250908_091534-f394z0xa/files/config.yaml ADDED
@@ -0,0 +1,160 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.21.3
4
+ code_path: source-self-forcing-causvid_train_ode.py
5
+ e:
6
+ wcpbsusleulz3a9y7yho5o0ck602eklv:
7
+ args:
8
+ - --config_path
9
+ - configs/wan_causal_ode.yaml
10
+ codePath: causvid/train_ode.py
11
+ codePathLocal: causvid/train_ode.py
12
+ cpu_count: 48
13
+ cpu_count_logical: 96
14
+ cudaVersion: "12.8"
15
+ disk:
16
+ /:
17
+ total: "2079114358784"
18
+ used: "1396822892544"
19
20
+ executable: /home/yitongli/miniconda3/envs/causvid/bin/python3.10
21
+ git:
22
+ commit: adb6a5ecd07666b4d0290042915c8406e6d5ce22
23
+ remote: https://github.com/tianweiy/CausVid.git
24
+ gpu: NVIDIA A100-SXM4-80GB
25
+ gpu_count: 8
26
+ gpu_nvidia:
27
+ - architecture: Ampere
28
+ cudaCores: 6912
29
+ memoryTotal: "85899345920"
30
+ name: NVIDIA A100-SXM4-80GB
31
+ uuid: GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949
32
+ - architecture: Ampere
33
+ cudaCores: 6912
34
+ memoryTotal: "85899345920"
35
+ name: NVIDIA A100-SXM4-80GB
36
+ uuid: GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42
37
+ - architecture: Ampere
38
+ cudaCores: 6912
39
+ memoryTotal: "85899345920"
40
+ name: NVIDIA A100-SXM4-80GB
41
+ uuid: GPU-1f47056a-9c2c-8af1-8232-636203622830
42
+ - architecture: Ampere
43
+ cudaCores: 6912
44
+ memoryTotal: "85899345920"
45
+ name: NVIDIA A100-SXM4-80GB
46
+ uuid: GPU-38de1dff-a680-ec66-625b-49f2a31e3b42
47
+ - architecture: Ampere
48
+ cudaCores: 6912
49
+ memoryTotal: "85899345920"
50
+ name: NVIDIA A100-SXM4-80GB
51
+ uuid: GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204
52
+ - architecture: Ampere
53
+ cudaCores: 6912
54
+ memoryTotal: "85899345920"
55
+ name: NVIDIA A100-SXM4-80GB
56
+ uuid: GPU-194ed489-5bfa-defc-85b1-812953e7d84a
57
+ - architecture: Ampere
58
+ cudaCores: 6912
59
+ memoryTotal: "85899345920"
60
+ name: NVIDIA A100-SXM4-80GB
61
+ uuid: GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4
62
+ - architecture: Ampere
63
+ cudaCores: 6912
64
+ memoryTotal: "85899345920"
65
+ name: NVIDIA A100-SXM4-80GB
66
+ uuid: GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057
67
+ host: ip-172-31-3-169
68
+ memory:
69
+ total: "1204521443328"
70
+ os: Linux-6.8.0-1028-aws-x86_64-with-glibc2.39
71
+ program: /home/yitongli/CausVid/causvid/train_ode.py
72
+ python: CPython 3.10.18
73
+ root: ./output
74
+ startedAt: "2025-09-08T09:15:34.924173Z"
75
+ writerId: wcpbsusleulz3a9y7yho5o0ck602eklv
76
+ m: []
77
+ python_version: 3.10.18
78
+ t:
79
+ "1":
80
+ - 1
81
+ - 11
82
+ - 41
83
+ - 49
84
+ - 71
85
+ - 83
86
+ - 105
87
+ "2":
88
+ - 1
89
+ - 11
90
+ - 41
91
+ - 49
92
+ - 71
93
+ - 83
94
+ - 105
95
+ "3":
96
+ - 16
97
+ - 17
98
+ - 61
99
+ "4": 3.10.18
100
+ "5": 0.21.3
101
+ "6": 4.56.1
102
+ "12": 0.21.3
103
+ "13": linux-x86_64
104
+ batch_size:
105
+ value: 2
106
+ beta1:
107
+ value: 0.9
108
+ beta2:
109
+ value: 0.999
110
+ data_path:
111
+ value: ../mixkit_ode_lmdb
112
+ denoising_step_list:
113
+ value:
114
+ - 1000
115
+ - 757
116
+ - 522
117
+ - 0
118
+ distillation_loss:
119
+ value: ode
120
+ generator_fsdp_wrap_strategy:
121
+ value: size
122
+ generator_grad:
123
+ value:
124
+ model: true
125
+ generator_task:
126
+ value: causal_video
127
+ gradient_checkpointing:
128
+ value: true
129
+ log_iters:
130
+ value: 200
131
+ lr:
132
+ value: 2e-06
133
+ mixed_precision:
134
+ value: true
135
+ model_name:
136
+ value: causal_wan
137
+ no_save:
138
+ value: false
139
+ num_frame_per_block:
140
+ value: 3
141
+ output_path:
142
+ value: ./output
143
+ seed:
144
+ value: 4288120
145
+ sharding_strategy:
146
+ value: hybrid_full
147
+ text_encoder_fsdp_wrap_strategy:
148
+ value: size
149
+ wandb_entity:
150
+ value: liyitong-Tsinghua University
151
+ wandb_host:
152
+ value: https://api.wandb.ai
153
+ wandb_key:
154
+ value: 5409d3b960b01b25cec0f6abb5361b4022f0cc41
155
+ wandb_name:
156
+ value: wan_causal_ode
157
+ wandb_project:
158
+ value: self-forcing
159
+ warp_denoising_step:
160
+ value: false
output/wandb/run-20250908_091534-f394z0xa/files/output.log ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run dir: ./output/wandb/run-20250908_091534-f394z0xa/files
2
+ KV inference with 3 frames per block
3
+ ODERegression initialized.
4
+ cache a block wise causal mask with block size of 3 frames
5
+ BlockMask(shape=(1, 1, 32768, 32768), sparsity=42.52%,
6
+ (0, 0)
7
+ ████░░
8
+ ████░░
9
+ ████░░░░░░░░
10
+ ██████████░░
11
+ ██████████░░
12
+ ██████████░░░░░░░░
13
+ ████████████████░░
14
+ ████████████████░░
15
+ ████████████████░░░░░░░░
16
+ ██████████████████████░░
17
+ ██████████████████████░░
18
+ ██████████████████████░░░░░░░░
19
+ ████████████████████████████░░
20
+ ████████████████████████████░░
21
+ ████████████████████████████████░░
22
+ ████████████████████████████████░░
23
+ ████████████████████████████████░░░░░░░░
24
+ ████████████████████████████████████████
25
+ ████████████████████████████████████████
26
+ ████████████████████████████████████████
27
+ )
28
+ arrive
29
+ Start gathering distributed model states...
30
+ /home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc: https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial: https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html .
31
+ warnings.warn(
32
+ Model saved to ./output/2025-09-08-09-15-34.671833_seed4288120/checkpoint_model_000000/model.pt
33
+ training step 0...
34
+ Saving video: 0%| | 0/3 [00:00<?, ?it/s]
35
+ Traceback (most recent call last):
36
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 285, in <module>
37
+ main()
38
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 279, in main
39
+ trainer.train()
40
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 243, in train
41
+ self.generate_video()
42
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 217, in generate_video
43
+ save_video(video, output_path, fps=15, quality=5)
44
+ File "/home/yitongli/CausVid/causvid/train_ode.py", line 42, in save_video
45
+ writer.append_data(frame)
46
+ File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/imageio/core/format.py", line 590, in append_data
47
+ return self._append_data(im, total_meta)
48
+ File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/imageio/plugins/ffmpeg.py", line 584, in _append_data
49
+ raise ValueError("Image must have 1, 2, 3 or 4 channels")
50
+ ValueError: Image must have 1, 2, 3 or 4 channels
51
+ [rank0]: Traceback (most recent call last):
52
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 285, in <module>
53
+ [rank0]: main()
54
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 279, in main
55
+ [rank0]: trainer.train()
56
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 243, in train
57
+ [rank0]: self.generate_video()
58
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 217, in generate_video
59
+ [rank0]: save_video(video, output_path, fps=15, quality=5)
60
+ [rank0]: File "/home/yitongli/CausVid/causvid/train_ode.py", line 42, in save_video
61
+ [rank0]: writer.append_data(frame)
62
+ [rank0]: File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/imageio/core/format.py", line 590, in append_data
63
+ [rank0]: return self._append_data(im, total_meta)
64
+ [rank0]: File "/home/yitongli/miniconda3/envs/causvid/lib/python3.10/site-packages/imageio/plugins/ffmpeg.py", line 584, in _append_data
65
+ [rank0]: raise ValueError("Image must have 1, 2, 3 or 4 channels")
66
+ [rank0]: ValueError: Image must have 1, 2, 3 or 4 channels
output/wandb/run-20250908_091534-f394z0xa/files/requirements.txt ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ nvidia-cuda-nvrtc-cu12==12.8.93
2
+ filelock==3.19.1
3
+ aiofiles==24.1.0
4
+ PyYAML==6.0.2
5
+ httpx==0.28.1
6
+ multidict==6.6.4
7
+ tifffile==2025.5.10
8
+ tzdata==2025.2
9
+ urllib3==2.5.0
10
+ decord==0.6.0
11
+ certifi==2025.8.3
12
+ setuptools==78.1.1
13
+ websocket-client==1.8.0
14
+ gitdb==4.0.12
15
+ yarl==1.20.1
16
+ tqdm==4.67.1
17
+ open_clip_torch==3.1.0
18
+ pyparsing==3.2.3
19
+ fastapi==0.116.1
20
+ nvidia-curand-cu12==10.3.9.90
21
+ mdurl==0.1.2
22
+ torchvision==0.23.0
23
+ h11==0.16.0
24
+ pytz==2025.2
25
+ six==1.17.0
26
+ nvidia-cufile-cu12==1.13.1.3
27
+ aiohappyeyeballs==2.6.1
28
+ wandb==0.21.3
29
+ nvidia-nvjitlink-cu12==12.8.93
30
+ cycler==0.12.1
31
+ anyio==4.10.0
32
+ scikit-image==0.25.2
33
+ nvidia-cuda-runtime-cu12==12.8.90
34
+ sentencepiece==0.2.1
35
+ rich==14.1.0
36
+ pydantic==2.11.7
37
+ GitPython==3.1.45
38
+ python-dateutil==2.9.0.post0
39
+ accelerate==1.10.1
40
+ proglog==0.1.12
41
+ sentry-sdk==2.37.0
42
+ nvidia-cusparselt-cu12==0.7.1
43
+ dashscope==1.24.3
44
+ platformdirs==4.4.0
45
+ safehttpx==0.1.6
46
+ fsspec==2025.9.0
47
+ lazy_loader==0.4
48
+ typing_extensions==4.15.0
49
+ semantic-version==2.10.0
50
+ numpy==1.24.4
51
+ nvidia-cufft-cu12==11.3.3.83
52
+ ruff==0.12.12
53
+ nvidia-cudnn-cu12==9.10.2.21
54
+ annotated-types==0.7.0
55
+ decorator==4.4.2
56
+ antlr4-python3-runtime==4.9.3
57
+ psutil==7.0.0
58
+ Brotli==1.1.0
59
+ tomlkit==0.13.3
60
+ httpcore==1.0.9
61
+ kiwisolver==1.4.9
62
+ nvidia-cusparse-cu12==12.5.8.93
63
+ groovy==0.1.2
64
+ protobuf==6.32.0
65
+ orjson==3.11.3
66
+ scipy==1.15.3
67
+ regex==2025.9.1
68
+ MarkupSafe==3.0.2
69
+ av==13.1.0
70
+ timm==1.0.19
71
+ uvicorn==0.35.0
72
+ wheel==0.45.1
73
+ Pygments==2.19.2
74
+ websockets==15.0.1
75
+ lmdb==1.7.3
76
+ sympy==1.14.0
77
+ einops==0.8.1
78
+ idna==3.10
79
+ triton==3.4.0
80
+ torch==2.8.0
81
+ moviepy==1.0.3
82
+ nvidia-nvtx-cu12==12.8.90
83
+ matplotlib==3.10.6
84
+ pillow==11.3.0
85
+ charset-normalizer==3.4.3
86
+ attrs==25.3.0
87
+ aiosignal==1.4.0
88
+ markdown-it-py==4.0.0
89
+ requests==2.32.5
90
+ typer==0.17.4
91
+ huggingface-hub==0.34.4
92
+ nvidia-nccl-cu12==2.27.3
93
+ propcache==0.3.2
94
+ opencv-python==4.11.0.86
95
+ ffmpy==0.6.1
96
+ jmespath==1.0.1
97
+ botocore==1.40.25
98
+ pydantic_core==2.33.2
99
+ fonttools==4.59.2
100
+ omegaconf==2.3.0
101
+ pycparser==2.22
102
+ mpmath==1.3.0
103
+ flash_attn==2.8.3
104
+ smmap==5.0.2
105
+ gradio_client==1.12.1
106
+ exceptiongroup==1.3.0
107
+ cffi==1.17.1
108
+ diffusers==0.31.0
109
+ nvidia-cusolver-cu12==11.7.3.90
110
+ contourpy==1.3.2
111
+ cryptography==45.0.7
112
+ nvidia-cuda-cupti-cu12==12.8.90
113
+ wcwidth==0.2.13
114
+ zipp==3.23.0
115
+ safetensors==0.6.2
116
+ gradio==5.44.1
117
+ click==8.2.1
118
+ frozenlist==1.7.0
119
+ networkx==3.4.2
120
+ s3transfer==0.13.1
121
+ shellingham==1.5.4
122
+ starlette==0.47.3
123
+ packaging==25.0
124
+ ftfy==6.3.1
125
+ importlib_metadata==8.7.0
126
+ transformers==4.56.1
127
+ nvidia-cublas-cu12==12.8.4.1
128
+ Jinja2==3.1.6
129
+ pycocotools==2.0.10
130
+ sniffio==1.3.1
131
+ hf-xet==1.1.9
132
+ typing-inspection==0.4.1
133
+ pandas==2.3.2
134
+ python-multipart==0.0.20
135
+ aiohttp==3.12.15
136
+ clip==1.0
137
+ pydub==0.25.1
138
+ easydict==1.13
139
+ pip==25.2
140
+ tokenizers==0.22.0
141
+ imageio==2.37.0
142
+ async-timeout==5.0.1
143
+ boto3==1.40.25
144
+ imageio-ffmpeg==0.6.0
145
+ CausVid==0.0.1
output/wandb/run-20250908_091534-f394z0xa/files/wandb-metadata.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1028-aws-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2025-09-08T09:15:34.924173Z",
5
+ "args": [
6
+ "--config_path",
7
+ "configs/wan_causal_ode.yaml"
8
+ ],
9
+ "program": "/home/yitongli/CausVid/causvid/train_ode.py",
10
+ "codePath": "causvid/train_ode.py",
11
+ "codePathLocal": "causvid/train_ode.py",
12
+ "git": {
13
+ "remote": "https://github.com/tianweiy/CausVid.git",
14
+ "commit": "adb6a5ecd07666b4d0290042915c8406e6d5ce22"
15
+ },
16
+ "email": "[email protected]",
17
+ "root": "./output",
18
+ "host": "ip-172-31-3-169",
19
+ "executable": "/home/yitongli/miniconda3/envs/causvid/bin/python3.10",
20
+ "cpu_count": 48,
21
+ "cpu_count_logical": 96,
22
+ "gpu": "NVIDIA A100-SXM4-80GB",
23
+ "gpu_count": 8,
24
+ "disk": {
25
+ "/": {
26
+ "total": "2079114358784",
27
+ "used": "1396822892544"
28
+ }
29
+ },
30
+ "memory": {
31
+ "total": "1204521443328"
32
+ },
33
+ "gpu_nvidia": [
34
+ {
35
+ "name": "NVIDIA A100-SXM4-80GB",
36
+ "memoryTotal": "85899345920",
37
+ "cudaCores": 6912,
38
+ "architecture": "Ampere",
39
+ "uuid": "GPU-88ce35f2-86d5-a394-f90d-a52e2cd45949"
40
+ },
41
+ {
42
+ "name": "NVIDIA A100-SXM4-80GB",
43
+ "memoryTotal": "85899345920",
44
+ "cudaCores": 6912,
45
+ "architecture": "Ampere",
46
+ "uuid": "GPU-1039594d-55ae-3eb3-339e-6d4d62c81d42"
47
+ },
48
+ {
49
+ "name": "NVIDIA A100-SXM4-80GB",
50
+ "memoryTotal": "85899345920",
51
+ "cudaCores": 6912,
52
+ "architecture": "Ampere",
53
+ "uuid": "GPU-1f47056a-9c2c-8af1-8232-636203622830"
54
+ },
55
+ {
56
+ "name": "NVIDIA A100-SXM4-80GB",
57
+ "memoryTotal": "85899345920",
58
+ "cudaCores": 6912,
59
+ "architecture": "Ampere",
60
+ "uuid": "GPU-38de1dff-a680-ec66-625b-49f2a31e3b42"
61
+ },
62
+ {
63
+ "name": "NVIDIA A100-SXM4-80GB",
64
+ "memoryTotal": "85899345920",
65
+ "cudaCores": 6912,
66
+ "architecture": "Ampere",
67
+ "uuid": "GPU-712ffb29-5da2-92e5-99b7-9f148e8c1204"
68
+ },
69
+ {
70
+ "name": "NVIDIA A100-SXM4-80GB",
71
+ "memoryTotal": "85899345920",
72
+ "cudaCores": 6912,
73
+ "architecture": "Ampere",
74
+ "uuid": "GPU-194ed489-5bfa-defc-85b1-812953e7d84a"
75
+ },
76
+ {
77
+ "name": "NVIDIA A100-SXM4-80GB",
78
+ "memoryTotal": "85899345920",
79
+ "cudaCores": 6912,
80
+ "architecture": "Ampere",
81
+ "uuid": "GPU-21b1f0be-4c00-4af7-0649-9942ae8fd0e4"
82
+ },
83
+ {
84
+ "name": "NVIDIA A100-SXM4-80GB",
85
+ "memoryTotal": "85899345920",
86
+ "cudaCores": 6912,
87
+ "architecture": "Ampere",
88
+ "uuid": "GPU-195cca5b-c8ee-790b-4d30-ae4d7aa93057"
89
+ }
90
+ ],
91
+ "cudaVersion": "12.8",
92
+ "writerId": "wcpbsusleulz3a9y7yho5o0ck602eklv"
93
+ }
output/wandb/run-20250908_091534-f394z0xa/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"generator_grad_norm":2.03125,"loss_at_time_500":0.148712158203125,"_timestamp":1.7573230600618684e+09,"_step":0,"_wandb":{"runtime":142},"_runtime":142.749615808,"generator_loss":0.16015625}
output/wandb/run-20250908_091534-f394z0xa/logs/debug-internal.log ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2025-09-08T09:15:35.140001084Z","level":"INFO","msg":"stream: starting","core version":"0.21.3"}
2
+ {"time":"2025-09-08T09:15:35.350074186Z","level":"INFO","msg":"stream: created new stream","id":"f394z0xa"}
3
+ {"time":"2025-09-08T09:15:35.350117697Z","level":"INFO","msg":"stream: started","id":"f394z0xa"}
4
+ {"time":"2025-09-08T09:15:35.350127873Z","level":"INFO","msg":"sender: started","stream_id":"f394z0xa"}
5
+ {"time":"2025-09-08T09:15:35.350125845Z","level":"INFO","msg":"handler: started","stream_id":"f394z0xa"}
6
+ {"time":"2025-09-08T09:15:35.350157006Z","level":"INFO","msg":"writer: started","stream_id":"f394z0xa"}
7
+ {"time":"2025-09-08T09:17:58.289962144Z","level":"INFO","msg":"stream: closing","id":"f394z0xa"}
8
+ {"time":"2025-09-08T09:17:58.601880656Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
9
+ {"time":"2025-09-08T09:17:58.768362935Z","level":"INFO","msg":"handler: closed","stream_id":"f394z0xa"}
10
+ {"time":"2025-09-08T09:17:58.768430865Z","level":"INFO","msg":"sender: closed","stream_id":"f394z0xa"}
11
+ {"time":"2025-09-08T09:17:58.768439365Z","level":"INFO","msg":"stream: closed","id":"f394z0xa"}
output/wandb/run-20250908_091534-f394z0xa/logs/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_setup.py:_flush():81] Current SDK version is 0.21.3
2
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_setup.py:_flush():81] Configure stats pid to 4032801
3
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/.config/wandb/settings
4
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_setup.py:_flush():81] Loading settings from /home/yitongli/CausVid/wandb/settings
5
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_init.py:setup_run_log_directory():686] Logging user logs to ./output/wandb/run-20250908_091534-f394z0xa/logs/debug.log
7
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_init.py:setup_run_log_directory():687] Logging internal logs to ./output/wandb/run-20250908_091534-f394z0xa/logs/debug-internal.log
8
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_init.py:init():813] calling init triggers
9
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_init.py:init():818] wandb.init called with sweep_config: {}
10
+ config: {'model_name': 'causal_wan', 'generator_grad': {'model': True}, 'denoising_step_list': [1000, 757, 522, 0], 'generator_task': 'causal_video', 'generator_fsdp_wrap_strategy': 'size', 'text_encoder_fsdp_wrap_strategy': 'size', 'mixed_precision': True, 'seed': 4288120, 'wandb_host': 'https://api.wandb.ai', 'wandb_key': '5409d3b960b01b25cec0f6abb5361b4022f0cc41', 'wandb_entity': 'liyitong-Tsinghua University', 'wandb_project': 'self-forcing', 'wandb_name': 'wan_causal_ode', 'sharding_strategy': 'hybrid_full', 'lr': 2e-06, 'beta1': 0.9, 'beta2': 0.999, 'data_path': '../mixkit_ode_lmdb', 'batch_size': 2, 'log_iters': 200, 'output_path': './output', 'distillation_loss': 'ode', 'gradient_checkpointing': True, 'num_frame_per_block': 3, 'warp_denoising_step': False, 'no_save': False, '_wandb': {}}
11
+ 2025-09-08 09:15:34,925 INFO MainThread:4032801 [wandb_init.py:init():854] starting backend
12
+ 2025-09-08 09:15:35,132 INFO MainThread:4032801 [wandb_init.py:init():857] sending inform_init request
13
+ 2025-09-08 09:15:35,137 INFO MainThread:4032801 [wandb_init.py:init():865] backend started and connected
14
+ 2025-09-08 09:15:35,142 INFO MainThread:4032801 [wandb_init.py:init():936] updated telemetry
15
+ 2025-09-08 09:15:35,147 INFO MainThread:4032801 [wandb_init.py:init():960] communicating run to backend with 90.0 second timeout
16
+ 2025-09-08 09:15:35,538 INFO MainThread:4032801 [wandb_init.py:init():1011] starting run threads in backend
17
+ 2025-09-08 09:15:35,661 INFO MainThread:4032801 [wandb_run.py:_console_start():2494] atexit reg
18
+ 2025-09-08 09:15:35,661 INFO MainThread:4032801 [wandb_run.py:_redirect():2342] redirect: wrap_raw
19
+ 2025-09-08 09:15:35,661 INFO MainThread:4032801 [wandb_run.py:_redirect():2411] Wrapping output streams.
20
+ 2025-09-08 09:15:35,661 INFO MainThread:4032801 [wandb_run.py:_redirect():2434] Redirects installed.
21
+ 2025-09-08 09:15:35,664 INFO MainThread:4032801 [wandb_init.py:init():1057] run started, returning control to user process
22
+ 2025-09-08 09:15:36,097 INFO MainThread:4032801 [wandb_run.py:_config_callback():1380] config_cb None None {'_wandb': {'code_path': 'source-self-forcing-causvid_train_ode.py'}}
23
+ 2025-09-08 09:17:58,290 INFO wandb-AsyncioManager-main:4032801 [service_client.py:_forward_responses():84] Reached EOF.
24
+ 2025-09-08 09:17:58,290 INFO wandb-AsyncioManager-main:4032801 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.