Upload folder using huggingface_hub
Browse files- .gitattributes +1 -0
- checkpoints/step-039000-epoch-192-loss=0.0263.pt +3 -0
- config.json +59 -0
- config.yaml +55 -0
- dataset_statistics.json +133 -0
- eval/EVAL-libero_goal-instruct_vla-2025_09_08-15_42_23-step-039000-epoch-192-loss=0.0263.txt +0 -0
- eval/EVAL-libero_goal-instruct_vla-2025_09_08-15_42_28-step-039000-epoch-192-loss=0.0263.txt +0 -0
- eval/EVAL-libero_goal-instruct_vla-2025_09_08-15_42_40-step-039000-epoch-192-loss=0.0263.txt +0 -0
- run-metrics.jsonl +1 -0
- sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1.jsonl +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1.jsonl filter=lfs diff=lfs merge=lfs -text
|
checkpoints/step-039000-epoch-192-loss=0.0263.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:536f25f289267d93fa1782f8003645dbaadef084a572aa3a7a34c4a3bd837373
|
| 3 |
+
size 11322827655
|
config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"action_dim": 7,
|
| 3 |
+
"action_model_type": "DiT-B",
|
| 4 |
+
"data_root_dir": "/mnt/inspurfs/efm_t/robot_data/cache/LIBERO/dataset",
|
| 5 |
+
"debug": false,
|
| 6 |
+
"disable_instruction": false,
|
| 7 |
+
"fix_system1": false,
|
| 8 |
+
"future_action_window_size": 7,
|
| 9 |
+
"hf_token": "hf_token",
|
| 10 |
+
"image_aug": true,
|
| 11 |
+
"is_resume": true,
|
| 12 |
+
"load_all_data_for_training": true,
|
| 13 |
+
"num_of_meta_query": 64,
|
| 14 |
+
"past_action_window_size": 0,
|
| 15 |
+
"pretrained_checkpoint": "/mnt/petrelfs/yangshuai1/rep/InstructVLA_official/outputs/libero_wrist/sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1/checkpoints/step-025500-epoch-125-loss=0.0168.pt",
|
| 16 |
+
"repeated_diffusion_steps": 4,
|
| 17 |
+
"resume_epoch": 125,
|
| 18 |
+
"resume_step": 25500,
|
| 19 |
+
"run_id": "sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1",
|
| 20 |
+
"run_id_note": null,
|
| 21 |
+
"run_root_dir": "outputs/libero_wrist",
|
| 22 |
+
"save_interval": 1500,
|
| 23 |
+
"seed": 42,
|
| 24 |
+
"stage": "stage1",
|
| 25 |
+
"trackers": [
|
| 26 |
+
"jsonl",
|
| 27 |
+
"wandb"
|
| 28 |
+
],
|
| 29 |
+
"use_ema": false,
|
| 30 |
+
"use_mm": false,
|
| 31 |
+
"vla": {
|
| 32 |
+
"action_tokenizer": "extra_action_tokenizer",
|
| 33 |
+
"base_vlm": "/mnt/petrelfs/yangshuai1/yangshuai1/share_mllm/Eagle2-2B",
|
| 34 |
+
"data_mix": "libero_goal_no_noops",
|
| 35 |
+
"enable_gradient_checkpointing": true,
|
| 36 |
+
"enable_mixed_precision_training": true,
|
| 37 |
+
"epochs": 100,
|
| 38 |
+
"expected_world_size": 8,
|
| 39 |
+
"freeze_llm_backbone": false,
|
| 40 |
+
"freeze_vision_backbone": false,
|
| 41 |
+
"global_batch_size": 256,
|
| 42 |
+
"learning_rate": 5e-05,
|
| 43 |
+
"lr_scheduler_type": "constant",
|
| 44 |
+
"max_grad_norm": 1.0,
|
| 45 |
+
"max_steps": null,
|
| 46 |
+
"per_device_batch_size": 32,
|
| 47 |
+
"reduce_in_full_precision": true,
|
| 48 |
+
"shuffle_buffer_size": 250000,
|
| 49 |
+
"train_strategy": "fsdp-full-shard",
|
| 50 |
+
"type": "prism-qwen25-dinosiglip-224px+0_5b",
|
| 51 |
+
"unfreeze_last_llm_layer": false,
|
| 52 |
+
"vla_id": "prism-qwen25-dinosiglip-224px+0_5b",
|
| 53 |
+
"warmup_ratio": 0.0,
|
| 54 |
+
"weight_decay": 0.0
|
| 55 |
+
},
|
| 56 |
+
"wandb_entity": "shuaiyang2003",
|
| 57 |
+
"wandb_project": "dual_sys_libero",
|
| 58 |
+
"with_pointing": true
|
| 59 |
+
}
|
config.yaml
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
action_dim: 7
|
| 2 |
+
action_model_type: DiT-B
|
| 3 |
+
data_root_dir: /mnt/inspurfs/efm_t/robot_data/cache/LIBERO/dataset
|
| 4 |
+
debug: false
|
| 5 |
+
disable_instruction: false
|
| 6 |
+
fix_system1: false
|
| 7 |
+
future_action_window_size: 7
|
| 8 |
+
hf_token: hf_token
|
| 9 |
+
image_aug: true
|
| 10 |
+
is_resume: true
|
| 11 |
+
load_all_data_for_training: true
|
| 12 |
+
num_of_meta_query: 64
|
| 13 |
+
past_action_window_size: 0
|
| 14 |
+
pretrained_checkpoint: /mnt/petrelfs/yangshuai1/rep/InstructVLA_official/outputs/libero_wrist/sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1/checkpoints/step-025500-epoch-125-loss=0.0168.pt
|
| 15 |
+
repeated_diffusion_steps: 4
|
| 16 |
+
resume_epoch: 125
|
| 17 |
+
resume_step: 25500
|
| 18 |
+
run_id: sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1
|
| 19 |
+
run_id_note: null
|
| 20 |
+
run_root_dir: outputs/libero_wrist
|
| 21 |
+
save_interval: 1500
|
| 22 |
+
seed: 42
|
| 23 |
+
stage: stage1
|
| 24 |
+
trackers:
|
| 25 |
+
- jsonl
|
| 26 |
+
- wandb
|
| 27 |
+
use_ema: false
|
| 28 |
+
use_mm: false
|
| 29 |
+
vla:
|
| 30 |
+
action_tokenizer: extra_action_tokenizer
|
| 31 |
+
base_vlm: /mnt/petrelfs/yangshuai1/yangshuai1/share_mllm/Eagle2-2B
|
| 32 |
+
data_mix: libero_goal_no_noops
|
| 33 |
+
enable_gradient_checkpointing: true
|
| 34 |
+
enable_mixed_precision_training: true
|
| 35 |
+
epochs: 100
|
| 36 |
+
expected_world_size: 8
|
| 37 |
+
freeze_llm_backbone: false
|
| 38 |
+
freeze_vision_backbone: false
|
| 39 |
+
global_batch_size: 256
|
| 40 |
+
learning_rate: 5.0e-05
|
| 41 |
+
lr_scheduler_type: constant
|
| 42 |
+
max_grad_norm: 1.0
|
| 43 |
+
max_steps: null
|
| 44 |
+
per_device_batch_size: 32
|
| 45 |
+
reduce_in_full_precision: true
|
| 46 |
+
shuffle_buffer_size: 250000
|
| 47 |
+
train_strategy: fsdp-full-shard
|
| 48 |
+
type: prism-qwen25-dinosiglip-224px+0_5b
|
| 49 |
+
unfreeze_last_llm_layer: false
|
| 50 |
+
vla_id: prism-qwen25-dinosiglip-224px+0_5b
|
| 51 |
+
warmup_ratio: 0.0
|
| 52 |
+
weight_decay: 0.0
|
| 53 |
+
wandb_entity: shuaiyang2003
|
| 54 |
+
wandb_project: dual_sys_libero
|
| 55 |
+
with_pointing: true
|
dataset_statistics.json
ADDED
|
@@ -0,0 +1,133 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"libero_goal_no_noops": {
|
| 3 |
+
"action": {
|
| 4 |
+
"mean": [
|
| 5 |
+
0.04721052572131157,
|
| 6 |
+
0.028835246339440346,
|
| 7 |
+
-0.1485840231180191,
|
| 8 |
+
-0.0025010062381625175,
|
| 9 |
+
0.026408178731799126,
|
| 10 |
+
0.027379808947443962,
|
| 11 |
+
0.6299911737442017
|
| 12 |
+
],
|
| 13 |
+
"std": [
|
| 14 |
+
0.3968801498413086,
|
| 15 |
+
0.3473387360572815,
|
| 16 |
+
0.49239858984947205,
|
| 17 |
+
0.055331431329250336,
|
| 18 |
+
0.07844757288694382,
|
| 19 |
+
0.10008802264928818,
|
| 20 |
+
0.48270025849342346
|
| 21 |
+
],
|
| 22 |
+
"max": [
|
| 23 |
+
0.9375,
|
| 24 |
+
0.9375,
|
| 25 |
+
0.9375,
|
| 26 |
+
0.3557142913341522,
|
| 27 |
+
0.375,
|
| 28 |
+
0.375,
|
| 29 |
+
1.0
|
| 30 |
+
],
|
| 31 |
+
"min": [
|
| 32 |
+
-0.9375,
|
| 33 |
+
-0.9375,
|
| 34 |
+
-0.9375,
|
| 35 |
+
-0.2582142949104309,
|
| 36 |
+
-0.375,
|
| 37 |
+
-0.2871428430080414,
|
| 38 |
+
0.0
|
| 39 |
+
],
|
| 40 |
+
"q01": [
|
| 41 |
+
-0.8785714507102966,
|
| 42 |
+
-0.7553571462631226,
|
| 43 |
+
-0.9375,
|
| 44 |
+
-0.1510714292526245,
|
| 45 |
+
-0.1639285683631897,
|
| 46 |
+
-0.13777500048279764,
|
| 47 |
+
0.0
|
| 48 |
+
],
|
| 49 |
+
"q99": [
|
| 50 |
+
0.9375,
|
| 51 |
+
0.9107142686843872,
|
| 52 |
+
0.9375,
|
| 53 |
+
0.20357142388820648,
|
| 54 |
+
0.26357144117355347,
|
| 55 |
+
0.375,
|
| 56 |
+
1.0
|
| 57 |
+
],
|
| 58 |
+
"mask": [
|
| 59 |
+
true,
|
| 60 |
+
true,
|
| 61 |
+
true,
|
| 62 |
+
true,
|
| 63 |
+
true,
|
| 64 |
+
true,
|
| 65 |
+
false
|
| 66 |
+
]
|
| 67 |
+
},
|
| 68 |
+
"proprio": {
|
| 69 |
+
"mean": [
|
| 70 |
+
-0.09923473745584488,
|
| 71 |
+
0.013597904704511166,
|
| 72 |
+
1.0694637298583984,
|
| 73 |
+
2.82898211479187,
|
| 74 |
+
0.30799180269241333,
|
| 75 |
+
-0.274286687374115,
|
| 76 |
+
0.028092455118894577,
|
| 77 |
+
-0.027339335530996323
|
| 78 |
+
],
|
| 79 |
+
"std": [
|
| 80 |
+
0.11653962731361389,
|
| 81 |
+
0.11478105187416077,
|
| 82 |
+
0.10487838834524155,
|
| 83 |
+
0.5570293664932251,
|
| 84 |
+
0.7221656441688538,
|
| 85 |
+
0.36479514837265015,
|
| 86 |
+
0.01507475133985281,
|
| 87 |
+
0.014990941621363163
|
| 88 |
+
],
|
| 89 |
+
"max": [
|
| 90 |
+
0.13579000532627106,
|
| 91 |
+
0.33316105604171753,
|
| 92 |
+
1.3660105466842651,
|
| 93 |
+
3.473310708999634,
|
| 94 |
+
2.6688623428344727,
|
| 95 |
+
0.8255361318588257,
|
| 96 |
+
0.04233968257904053,
|
| 97 |
+
0.0010111660230904818
|
| 98 |
+
],
|
| 99 |
+
"min": [
|
| 100 |
+
-0.46141114830970764,
|
| 101 |
+
-0.30129560828208923,
|
| 102 |
+
0.9083037972450256,
|
| 103 |
+
0.35277295112609863,
|
| 104 |
+
-1.4858465194702148,
|
| 105 |
+
-1.5227035284042358,
|
| 106 |
+
-0.0013586411951109767,
|
| 107 |
+
-0.042040832340717316
|
| 108 |
+
],
|
| 109 |
+
"q01": [
|
| 110 |
+
-0.42401049643754957,
|
| 111 |
+
-0.27338370531797407,
|
| 112 |
+
0.911226047873497,
|
| 113 |
+
1.3085840785503386,
|
| 114 |
+
-0.691297555565834,
|
| 115 |
+
-1.130668159723282,
|
| 116 |
+
0.0016738151130266487,
|
| 117 |
+
-0.040336399003863335
|
| 118 |
+
],
|
| 119 |
+
"q99": [
|
| 120 |
+
0.08990443304181095,
|
| 121 |
+
0.26473945528268716,
|
| 122 |
+
1.2910678112506866,
|
| 123 |
+
3.2425890421867365,
|
| 124 |
+
2.3376442337036116,
|
| 125 |
+
0.4659483411908149,
|
| 126 |
+
0.040610933862626555,
|
| 127 |
+
-0.0015016929572448147
|
| 128 |
+
]
|
| 129 |
+
},
|
| 130 |
+
"num_transitions": 52042,
|
| 131 |
+
"num_trajectories": 428
|
| 132 |
+
}
|
| 133 |
+
}
|
eval/EVAL-libero_goal-instruct_vla-2025_09_08-15_42_23-step-039000-epoch-192-loss=0.0263.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
eval/EVAL-libero_goal-instruct_vla-2025_09_08-15_42_28-step-039000-epoch-192-loss=0.0263.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
eval/EVAL-libero_goal-instruct_vla-2025_09_08-15_42_40-step-039000-epoch-192-loss=0.0263.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
run-metrics.jsonl
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"hparams": {"action_dim": 7, "action_model_type": "DiT-B", "data_root_dir": "/mnt/inspurfs/efm_t/robot_data/cache/LIBERO/dataset", "debug": false, "disable_instruction": false, "fix_system1": false, "future_action_window_size": 7, "hf_token": "hf_token", "image_aug": true, "is_resume": true, "load_all_data_for_training": true, "num_of_meta_query": 64, "past_action_window_size": 0, "pretrained_checkpoint": "/mnt/petrelfs/yangshuai1/rep/InstructVLA_official/outputs/libero_wrist/sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1/checkpoints/step-025500-epoch-125-loss=0.0168.pt", "repeated_diffusion_steps": 4, "resume_epoch": 125, "resume_step": 25500, "run_id": "sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1", "run_id_note": null, "run_root_dir": "outputs/libero_wrist", "save_interval": 1500, "seed": 42, "stage": "stage1", "trackers": ["jsonl", "wandb"], "use_ema": false, "use_mm": false, "vla": {"action_tokenizer": "extra_action_tokenizer", "base_vlm": "/mnt/petrelfs/yangshuai1/yangshuai1/share_mllm/Eagle2-2B", "data_mix": "libero_goal_no_noops", "enable_gradient_checkpointing": true, "enable_mixed_precision_training": true, "epochs": 100, "expected_world_size": 8, "freeze_llm_backbone": false, "freeze_vision_backbone": false, "global_batch_size": 256, "learning_rate": 5e-05, "lr_scheduler_type": "constant", "max_grad_norm": 1.0, "max_steps": null, "per_device_batch_size": 32, "reduce_in_full_precision": true, "shuffle_buffer_size": 250000, "train_strategy": "fsdp-full-shard", "type": "prism-qwen25-dinosiglip-224px+0_5b", "unfreeze_last_llm_layer": false, "vla_id": "prism-qwen25-dinosiglip-224px+0_5b", "warmup_ratio": 0.0, "weight_decay": 0.0}, "wandb_entity": "shuaiyang2003", "wandb_project": "dual_sys_libero", "with_pointing": true}, "run_id": "sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1"}
|
sys12_meta_query_action_only_sync_pretraining_v2_query_64_mlp_lora_libero_goal_wrist--image_augstage1.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86e070e1d1e7a6e80810bb4f3358cfca015c05018810a2408d0f52f9c39b3513
|
| 3 |
+
size 14214150
|