Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/optimizer.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/random_states_0.pkl +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/scheduler.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/config.json +33 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/diffusion_pytorch_model-00001-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/diffusion_pytorch_model-00002-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/diffusion_pytorch_model-00003-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/diffusion_pytorch_model.safetensors.index.json +0 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/optimizer.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/random_states_0.pkl +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/scheduler.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/config.json +33 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/diffusion_pytorch_model-00001-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/diffusion_pytorch_model-00002-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/diffusion_pytorch_model-00003-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/diffusion_pytorch_model.safetensors.index.json +0 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/optimizer.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/random_states_0.pkl +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/scheduler.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/config.json +33 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/diffusion_pytorch_model-00001-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/diffusion_pytorch_model-00002-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/diffusion_pytorch_model-00003-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/diffusion_pytorch_model.safetensors.index.json +0 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/optimizer.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/random_states_0.pkl +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/scheduler.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/config.json +33 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/diffusion_pytorch_model-00001-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/diffusion_pytorch_model-00002-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/diffusion_pytorch_model-00003-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/diffusion_pytorch_model.safetensors.index.json +0 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/optimizer.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/random_states_0.pkl +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/scheduler.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/config.json +33 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/diffusion_pytorch_model-00001-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/diffusion_pytorch_model-00002-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/diffusion_pytorch_model-00003-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/diffusion_pytorch_model.safetensors.index.json +0 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/optimizer.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/random_states_0.pkl +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/scheduler.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/config.json +33 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/diffusion_pytorch_model-00001-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/diffusion_pytorch_model-00002-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/diffusion_pytorch_model-00003-of-00003.safetensors +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/diffusion_pytorch_model.safetensors.index.json +0 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1500/optimizer.bin +3 -0
- models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1500/random_states_0.pkl +3 -0
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1618d4bb6981a1c07214c3132c86688516ad80ee71105cbd6329f8a5b7b3eddf
|
3 |
+
size 22283593862
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9f85d5adab21fbd56386f98b169621d59c74d0b2a87a0bc872e9212e66b02aa
|
3 |
+
size 16100
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9682b9b65c47b86fbced2afa76caa57881592d40b28fa757a99b88e164e6c421
|
3 |
+
size 1000
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "CogVideoXTransformer3DModel",
|
3 |
+
"_diffusers_version": "0.33.0.dev0",
|
4 |
+
"_name_or_path": "THUDM/CogVideoX-5b",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"dropout": 0.0,
|
9 |
+
"flip_sin_to_cos": true,
|
10 |
+
"freq_shift": 0,
|
11 |
+
"in_channels": 16,
|
12 |
+
"max_text_seq_length": 226,
|
13 |
+
"norm_elementwise_affine": true,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"num_attention_heads": 48,
|
16 |
+
"num_layers": 42,
|
17 |
+
"ofs_embed_dim": null,
|
18 |
+
"out_channels": 16,
|
19 |
+
"patch_bias": false,
|
20 |
+
"patch_size": 2,
|
21 |
+
"patch_size_t": 2,
|
22 |
+
"sample_frames": 81,
|
23 |
+
"sample_height": 60,
|
24 |
+
"sample_width": 90,
|
25 |
+
"spatial_interpolation_scale": 1.875,
|
26 |
+
"temporal_compression_ratio": 4,
|
27 |
+
"temporal_interpolation_scale": 1.0,
|
28 |
+
"text_embed_dim": 4096,
|
29 |
+
"time_embed_dim": 512,
|
30 |
+
"timestep_activation_fn": "silu",
|
31 |
+
"use_learned_positional_embeddings": false,
|
32 |
+
"use_rotary_positional_embeddings": true
|
33 |
+
}
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/diffusion_pytorch_model-00001-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b868430967b0267f24646d862b3c969837cbde04d4cdcc0feab6771ae1064c1
|
3 |
+
size 4977695424
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/diffusion_pytorch_model-00002-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1a4ffb6a06d232ecc4901be3cf6608e654d9a34025fbb19a003f94d4cf6aeac
|
3 |
+
size 4948039832
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/diffusion_pytorch_model-00003-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3b5c844e6bfe7b011368529cb294a9ff91ed93655d60e088dbd3b411b25a914
|
3 |
+
size 1215733728
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-100/transformer/diffusion_pytorch_model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:653121e3880ec96977b9dd4cdf086b33dcf4f2af9ad8d53d60cf7edba5a558d5
|
3 |
+
size 22283593862
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04151d41355990624dd49336a32c3669f0933846480e6f58c0c7416712f6caa5
|
3 |
+
size 16100
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c1d2cbbd480c80636d0e6c51c8da8b894e4841dafb5c2c01a78e65e8486eb49
|
3 |
+
size 1000
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "CogVideoXTransformer3DModel",
|
3 |
+
"_diffusers_version": "0.33.0.dev0",
|
4 |
+
"_name_or_path": "THUDM/CogVideoX-5b",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"dropout": 0.0,
|
9 |
+
"flip_sin_to_cos": true,
|
10 |
+
"freq_shift": 0,
|
11 |
+
"in_channels": 16,
|
12 |
+
"max_text_seq_length": 226,
|
13 |
+
"norm_elementwise_affine": true,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"num_attention_heads": 48,
|
16 |
+
"num_layers": 42,
|
17 |
+
"ofs_embed_dim": null,
|
18 |
+
"out_channels": 16,
|
19 |
+
"patch_bias": false,
|
20 |
+
"patch_size": 2,
|
21 |
+
"patch_size_t": 2,
|
22 |
+
"sample_frames": 81,
|
23 |
+
"sample_height": 60,
|
24 |
+
"sample_width": 90,
|
25 |
+
"spatial_interpolation_scale": 1.875,
|
26 |
+
"temporal_compression_ratio": 4,
|
27 |
+
"temporal_interpolation_scale": 1.0,
|
28 |
+
"text_embed_dim": 4096,
|
29 |
+
"time_embed_dim": 512,
|
30 |
+
"timestep_activation_fn": "silu",
|
31 |
+
"use_learned_positional_embeddings": false,
|
32 |
+
"use_rotary_positional_embeddings": true
|
33 |
+
}
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/diffusion_pytorch_model-00001-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50857fc03f7083a489b1b57abd98c7dfaa8463c870941688b855e83a74bbc9d4
|
3 |
+
size 4977695424
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/diffusion_pytorch_model-00002-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a03d54c2aad9e102f4c1cac6d3e0945a080af1b9cd3247118d86917526bfe07a
|
3 |
+
size 4948039832
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/diffusion_pytorch_model-00003-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92ea3fe25d55f9fee8e042401016038036f27d1fda906acb930a34d4a0b08c32
|
3 |
+
size 1215733728
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1000/transformer/diffusion_pytorch_model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:061fccf2f5e686b583f67afa93c053f11d71a96b7ffa1da85e1ebabdca47fa6b
|
3 |
+
size 22283593862
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8634c27e1b0e3398f01a2526b9df2d92c3398157a6752b2e73c8c9dd0f8503b7
|
3 |
+
size 16100
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ebfd2730e1f7370bcc13917fbde7fa9ceacb1aaa849f7693d3f98a4e7c73175
|
3 |
+
size 1000
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "CogVideoXTransformer3DModel",
|
3 |
+
"_diffusers_version": "0.33.0.dev0",
|
4 |
+
"_name_or_path": "THUDM/CogVideoX-5b",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"dropout": 0.0,
|
9 |
+
"flip_sin_to_cos": true,
|
10 |
+
"freq_shift": 0,
|
11 |
+
"in_channels": 16,
|
12 |
+
"max_text_seq_length": 226,
|
13 |
+
"norm_elementwise_affine": true,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"num_attention_heads": 48,
|
16 |
+
"num_layers": 42,
|
17 |
+
"ofs_embed_dim": null,
|
18 |
+
"out_channels": 16,
|
19 |
+
"patch_bias": false,
|
20 |
+
"patch_size": 2,
|
21 |
+
"patch_size_t": 2,
|
22 |
+
"sample_frames": 81,
|
23 |
+
"sample_height": 60,
|
24 |
+
"sample_width": 90,
|
25 |
+
"spatial_interpolation_scale": 1.875,
|
26 |
+
"temporal_compression_ratio": 4,
|
27 |
+
"temporal_interpolation_scale": 1.0,
|
28 |
+
"text_embed_dim": 4096,
|
29 |
+
"time_embed_dim": 512,
|
30 |
+
"timestep_activation_fn": "silu",
|
31 |
+
"use_learned_positional_embeddings": false,
|
32 |
+
"use_rotary_positional_embeddings": true
|
33 |
+
}
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/diffusion_pytorch_model-00001-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:853667f199168fec9f3f2c6a02c3d8d88b35eb2690030f0c0a6f733752eda78d
|
3 |
+
size 4977695424
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/diffusion_pytorch_model-00002-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fab3c7d02c62f2bb71be37c1604e6b60f5d77f63b0b62a7f8ca765ebec8e2ee0
|
3 |
+
size 4948039832
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/diffusion_pytorch_model-00003-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b47666aa9eaa935256b7855187180c6ff882e05b231ee1a6ac8a651d937f31c
|
3 |
+
size 1215733728
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1100/transformer/diffusion_pytorch_model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e3c08c356a887503bbe13b5540e9bc580045d54b2af258f7031423471414dd1
|
3 |
+
size 22283593862
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bedde6ebde66ff81a9fd5b1595a3e2b4bc567a01f4f5f940ba1661ce3cbfa7c6
|
3 |
+
size 16100
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a9ddf2479936555268818688e54f8d3cc66dd059bd394e34f8ffd5450378591
|
3 |
+
size 1000
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "CogVideoXTransformer3DModel",
|
3 |
+
"_diffusers_version": "0.33.0.dev0",
|
4 |
+
"_name_or_path": "THUDM/CogVideoX-5b",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"dropout": 0.0,
|
9 |
+
"flip_sin_to_cos": true,
|
10 |
+
"freq_shift": 0,
|
11 |
+
"in_channels": 16,
|
12 |
+
"max_text_seq_length": 226,
|
13 |
+
"norm_elementwise_affine": true,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"num_attention_heads": 48,
|
16 |
+
"num_layers": 42,
|
17 |
+
"ofs_embed_dim": null,
|
18 |
+
"out_channels": 16,
|
19 |
+
"patch_bias": false,
|
20 |
+
"patch_size": 2,
|
21 |
+
"patch_size_t": 2,
|
22 |
+
"sample_frames": 81,
|
23 |
+
"sample_height": 60,
|
24 |
+
"sample_width": 90,
|
25 |
+
"spatial_interpolation_scale": 1.875,
|
26 |
+
"temporal_compression_ratio": 4,
|
27 |
+
"temporal_interpolation_scale": 1.0,
|
28 |
+
"text_embed_dim": 4096,
|
29 |
+
"time_embed_dim": 512,
|
30 |
+
"timestep_activation_fn": "silu",
|
31 |
+
"use_learned_positional_embeddings": false,
|
32 |
+
"use_rotary_positional_embeddings": true
|
33 |
+
}
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/diffusion_pytorch_model-00001-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a80b1595683107526fa1fee49ccbc5545ed68cc8f37c7a86c6c2483b872d44e2
|
3 |
+
size 4977695424
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/diffusion_pytorch_model-00002-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92c58c14c0b1420f15bbdf28f232559df69165a5b08389abb62f132d891f1742
|
3 |
+
size 4948039832
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/diffusion_pytorch_model-00003-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b27a8389f2fbd596eb6bd477d13b0591990bfe798742c31f542cb8faf87cd957
|
3 |
+
size 1215733728
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1200/transformer/diffusion_pytorch_model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4249fbe12c0474e0d74f3090a42aff0549c18755d0906ebe5b81615680a4b538
|
3 |
+
size 22283593862
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e317026162505770c20d119a7b48ccd966917fffca35c21d5abede68f28ad4bc
|
3 |
+
size 16036
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c97a0847ee1e80266cbf242308321f2472d698d4292134ef577aa83fe218824b
|
3 |
+
size 1000
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "CogVideoXTransformer3DModel",
|
3 |
+
"_diffusers_version": "0.33.0.dev0",
|
4 |
+
"_name_or_path": "THUDM/CogVideoX-5b",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"dropout": 0.0,
|
9 |
+
"flip_sin_to_cos": true,
|
10 |
+
"freq_shift": 0,
|
11 |
+
"in_channels": 16,
|
12 |
+
"max_text_seq_length": 226,
|
13 |
+
"norm_elementwise_affine": true,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"num_attention_heads": 48,
|
16 |
+
"num_layers": 42,
|
17 |
+
"ofs_embed_dim": null,
|
18 |
+
"out_channels": 16,
|
19 |
+
"patch_bias": false,
|
20 |
+
"patch_size": 2,
|
21 |
+
"patch_size_t": 2,
|
22 |
+
"sample_frames": 81,
|
23 |
+
"sample_height": 60,
|
24 |
+
"sample_width": 90,
|
25 |
+
"spatial_interpolation_scale": 1.875,
|
26 |
+
"temporal_compression_ratio": 4,
|
27 |
+
"temporal_interpolation_scale": 1.0,
|
28 |
+
"text_embed_dim": 4096,
|
29 |
+
"time_embed_dim": 512,
|
30 |
+
"timestep_activation_fn": "silu",
|
31 |
+
"use_learned_positional_embeddings": false,
|
32 |
+
"use_rotary_positional_embeddings": true
|
33 |
+
}
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/diffusion_pytorch_model-00001-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12b5bcd9b8bc001886f62bfb66a0c041234730524853f1c05a0f6253684816ed
|
3 |
+
size 4977695424
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/diffusion_pytorch_model-00002-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aca4f34fa3c1d35e3cbc5717600cb245f1da8a26d72d94154441d6e124e7414c
|
3 |
+
size 4948039832
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/diffusion_pytorch_model-00003-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7957f9ec079ec9a5e3ddf1c487c50dd0f00904d4547bbb8a71ae07da8a129c72
|
3 |
+
size 1215733728
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1300/transformer/diffusion_pytorch_model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77c5188f00736e873819a968cfefd1125bd582d20910ed73fa52fbe610dee02b
|
3 |
+
size 22283593862
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb42cd3f78cb94a406f30994f25828bc03e5c83b4ff4aa2ed06fddd231ec9b6f
|
3 |
+
size 16036
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d436b8993c2407f75abd90010e9df802a39351334b5585f24fb3e331e1ab22a
|
3 |
+
size 1000
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "CogVideoXTransformer3DModel",
|
3 |
+
"_diffusers_version": "0.33.0.dev0",
|
4 |
+
"_name_or_path": "THUDM/CogVideoX-5b",
|
5 |
+
"activation_fn": "gelu-approximate",
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_head_dim": 64,
|
8 |
+
"dropout": 0.0,
|
9 |
+
"flip_sin_to_cos": true,
|
10 |
+
"freq_shift": 0,
|
11 |
+
"in_channels": 16,
|
12 |
+
"max_text_seq_length": 226,
|
13 |
+
"norm_elementwise_affine": true,
|
14 |
+
"norm_eps": 1e-05,
|
15 |
+
"num_attention_heads": 48,
|
16 |
+
"num_layers": 42,
|
17 |
+
"ofs_embed_dim": null,
|
18 |
+
"out_channels": 16,
|
19 |
+
"patch_bias": false,
|
20 |
+
"patch_size": 2,
|
21 |
+
"patch_size_t": 2,
|
22 |
+
"sample_frames": 81,
|
23 |
+
"sample_height": 60,
|
24 |
+
"sample_width": 90,
|
25 |
+
"spatial_interpolation_scale": 1.875,
|
26 |
+
"temporal_compression_ratio": 4,
|
27 |
+
"temporal_interpolation_scale": 1.0,
|
28 |
+
"text_embed_dim": 4096,
|
29 |
+
"time_embed_dim": 512,
|
30 |
+
"timestep_activation_fn": "silu",
|
31 |
+
"use_learned_positional_embeddings": false,
|
32 |
+
"use_rotary_positional_embeddings": true
|
33 |
+
}
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/diffusion_pytorch_model-00001-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e51ae408c45a147d0e3436d5685cf50ae0ffe9ecf2f7937154ceeceab923117
|
3 |
+
size 4977695424
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/diffusion_pytorch_model-00002-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7725b69f46d6fb0e8a8161e628525adb71c7a52e43fdad5fbd1474743eaa7785
|
3 |
+
size 4948039832
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/diffusion_pytorch_model-00003-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3280187a227d1a51d214120c9263b7c353c4adda1763eee820542769bc41971a
|
3 |
+
size 1215733728
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1400/transformer/diffusion_pytorch_model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c386b73086f2755e62f7ead442d87cbc3a5a5ae273ae8797d8709dca51ee90b
|
3 |
+
size 22283593862
|
models/cogvideox-sft__optimizer_adamw__steps_20000__lr-schedule_cosine_with_restarts__learning-rate_1e-4_0104/checkpoint-1500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:318a55ef49b0d5075789ce127937bec7e050a39ca3c963200c528b142a81b1c5
|
3 |
+
size 16036
|