Yysrc committed on
Commit
ccca3d9
·
verified ·
1 Parent(s): 3408fc9

Upload config.json

Browse files
Files changed (1) hide show
  1. config.json +43 -0
config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_gradient_checkpointing": true,
3
+ "_name_or_path": "Yysrc/Mantis-Base",
4
+ "action_dim": 7,
5
+ "action_model_type": "DiT-L",
6
+ "architectures": [
7
+ "Mantis"
8
+ ],
9
+ "attn_implementation": null,
10
+ "connector_num_hidden_layers": 12,
11
+ "diffusion_model_id": "Efficient-Large-Model/Sana_600M_512px_diffusers",
12
+ "future_action_window_size": 4,
13
+ "in_channels": 32,
14
+ "input_size": 16,
15
+ "loss_type": "flow",
16
+ "max_input_text_tokens": 256,
17
+ "max_timestep_gap": 6,
18
+ "mllm_id": "Qwen/Qwen2.5-VL-3B-Instruct",
19
+ "model_type": "mantis",
20
+ "modules_to_freeze": [
21
+ "vae",
22
+ "model.mllm_backbone.visual"
23
+ ],
24
+ "modules_to_unfreeze": [
25
+ "model.mllm_backbone.model.embed_tokens",
26
+ "model.policy_head",
27
+ "model.transformer",
28
+ "model.connector",
29
+ "model.mllm_backbone.model"
30
+ ],
31
+ "noise_scheduler_id": "Efficient-Large-Model/Sana_600M_512px_diffusers",
32
+ "num_actqueries": 6,
33
+ "num_gapqueries": 3,
34
+ "num_metaqueries": 9,
35
+ "past_action_window_size": 0,
36
+ "scheduler_id": "Efficient-Large-Model/Sana_600M_512px_diffusers",
37
+ "system_prompt": "You will be provided with an image observation and a corresponding instruction.",
38
+ "torch_dtype": "float32",
39
+ "training_mode": "image_action_language",
40
+ "transformers_version": "4.49.0",
41
+ "vae_downsample_f": 32,
42
+ "vae_id": "Efficient-Large-Model/Sana_600M_512px_diffusers"
43
+ }