| { | |
| "image_dim": 4, | |
| "image_size": 1024, | |
| "image_stride": 8, | |
| "text_token_dim": 2560, | |
| "text_token_len": 256, | |
| "video_base_size": [ | |
| 1, | |
| 32, | |
| 32 | |
| ], | |
| "image_base_size": [ | |
| 64, | |
| 64 | |
| ], | |
| "arch": [ | |
| "vit_d16w1024", | |
| "vit_d32w1024", | |
| "mlp_d6w1024" | |
| ] | |
| } | |
| { | |
| "image_dim": 4, | |
| "image_size": 1024, | |
| "image_stride": 8, | |
| "text_token_dim": 2560, | |
| "text_token_len": 256, | |
| "video_base_size": [ | |
| 1, | |
| 32, | |
| 32 | |
| ], | |
| "image_base_size": [ | |
| 64, | |
| 64 | |
| ], | |
| "arch": [ | |
| "vit_d16w1024", | |
| "vit_d32w1024", | |
| "mlp_d6w1024" | |
| ] | |
| } | |