Upload folder using huggingface_hub

Browse files

Files changed (7) hide show

pretrained_model/config.json +84 -0
pretrained_model/model.safetensors +3 -0
pretrained_model/policy_postprocessor.json +32 -0
pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors +3 -0
pretrained_model/policy_preprocessor.json +81 -0
pretrained_model/policy_preprocessor_step_2_normalizer_processor.safetensors +3 -0
pretrained_model/train_config.json +276 -0

pretrained_model/config.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "type": "vista",
+  "n_obs_steps": 1,
+  "input_features": {
+    "observation.state": {
+      "type": "STATE",
+      "shape": [
+        16
+      ]
+    },
+    "observation.images.left_wrist": {
+      "type": "VISUAL",
+      "shape": [
+        3,
+        224,
+        224
+      ]
+    },
+    "observation.images.right_wrist": {
+      "type": "VISUAL",
+      "shape": [
+        3,
+        224,
+        224
+      ]
+    }
+  },
+  "output_features": {
+    "action": {
+      "type": "ACTION",
+      "shape": [
+        16
+      ]
+    }
+  },
+  "device": "cuda",
+  "use_amp": false,
+  "use_delta_action": true,
+  "push_to_hub": false,
+  "repo_id": null,
+  "private": null,
+  "tags": null,
+  "license": null,
+  "pretrained_path": "/data/ysy/data/models/umi_0312_40w",
+  "paligemma_variant": "gemma_2b",
+  "action_expert_variant": "gemma_300m",
+  "dtype": "bfloat16",
+  "chunk_size": 50,
+  "n_action_steps": 50,
+  "max_state_dim": 32,
+  "max_action_dim": 32,
+  "num_inference_steps": 10,
+  "time_sampling_beta_alpha": 1.5,
+  "time_sampling_beta_beta": 1.0,
+  "time_sampling_scale": 0.999,
+  "time_sampling_offset": 0.001,
+  "min_period": 0.004,
+  "max_period": 4.0,
+  "image_resolution": [
+    224,
+    224
+  ],
+  "empty_cameras": 0,
+  "tokenizer_max_length": 200,
+  "normalization_mapping": {
+    "VISUAL": "IDENTITY",
+    "STATE": "QUANTILES",
+    "ACTION": "QUANTILES"
+  },
+  "gradient_checkpointing": false,
+  "compile_model": false,
+  "compile_mode": "max-autotune",
+  "optimizer_lr": 2.5e-05,
+  "optimizer_betas": [
+    0.9,
+    0.95
+  ],
+  "optimizer_eps": 1e-08,
+  "optimizer_weight_decay": 0.01,
+  "optimizer_grad_clip_norm": 1.0,
+  "scheduler_warmup_steps": 1000,
+  "scheduler_decay_steps": 300000,
+  "scheduler_decay_lr": 2.5e-06
+}

pretrained_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2b92361ce0150cf73773b6b8c966937942435aa02c8ed541f3ea3bd78edd1949
+size 7473096344

pretrained_model/policy_postprocessor.json ADDED Viewed

	@@ -0,0 +1,32 @@

+{
+  "name": "policy_postprocessor",
+  "steps": [
+    {
+      "registry_name": "unnormalizer_processor",
+      "config": {
+        "eps": 1e-08,
+        "features": {
+          "action": {
+            "type": "ACTION",
+            "shape": [
+              16
+            ]
+          }
+        },
+        "norm_map": {
+          "VISUAL": "IDENTITY",
+          "STATE": "QUANTILES",
+          "ACTION": "QUANTILES"
+        }
+      },
+      "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors"
+    },
+    {
+      "registry_name": "device_processor",
+      "config": {
+        "device": "cuda",
+        "float_dtype": null
+      }
+    }
+  ]
+}

pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe9b5c1fd200eb6ea91c2adbe2c77b2d6acd425636ef033c9a99b98443b7be6f
+size 6748

pretrained_model/policy_preprocessor.json ADDED Viewed

	@@ -0,0 +1,81 @@

+{
+  "name": "policy_preprocessor",
+  "steps": [
+    {
+      "registry_name": "rename_observations_processor",
+      "config": {
+        "rename_map": {}
+      }
+    },
+    {
+      "registry_name": "to_batch_processor",
+      "config": {}
+    },
+    {
+      "registry_name": "normalizer_processor",
+      "config": {
+        "eps": 1e-08,
+        "features": {
+          "observation.state": {
+            "type": "STATE",
+            "shape": [
+              16
+            ]
+          },
+          "observation.images.robot_0": {
+            "type": "VISUAL",
+            "shape": [
+              3,
+              224,
+              224
+            ]
+          },
+          "observation.images.robot_1": {
+            "type": "VISUAL",
+            "shape": [
+              3,
+              224,
+              224
+            ]
+          },
+          "action": {
+            "type": "ACTION",
+            "shape": [
+              16
+            ]
+          }
+        },
+        "norm_map": {
+          "VISUAL": "IDENTITY",
+          "STATE": "QUANTILES",
+          "ACTION": "QUANTILES"
+        }
+      },
+      "state_file": "policy_preprocessor_step_2_normalizer_processor.safetensors"
+    },
+    {
+      "registry_name": "vista_prepare_state_tokenizer_processor_step",
+      "config": {
+        "max_state_dim": 16
+      }
+    },
+    {
+      "registry_name": "tokenizer_processor",
+      "config": {
+        "max_length": 200,
+        "task_key": "task",
+        "padding_side": "right",
+        "padding": "max_length",
+        "truncation": true,
+        "tokenizer_name": "/data/ysy/data/models/plgm3b"
+      }
+    },
+    {
+      "registry_name": "device_processor",
+      "config": {
+        "device": "cuda",
+        "float_dtype": null
+      }
+    }
+  ]
+}

pretrained_model/policy_preprocessor_step_2_normalizer_processor.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe9b5c1fd200eb6ea91c2adbe2c77b2d6acd425636ef033c9a99b98443b7be6f
+size 6748

pretrained_model/train_config.json ADDED Viewed

	@@ -0,0 +1,276 @@

+{
+  "dataset": {
+    "repo_id": null,
+    "root": "/data/ysy/data/lerobot_pretrain_used",
+    "episodes": null,
+    "image_transforms": {
+      "enable": true,
+      "max_num_transforms": 3,
+      "random_order": false,
+      "tfs": {
+        "brightness": {
+          "weight": 1.0,
+          "type": "ColorJitter",
+          "kwargs": {
+            "brightness": [
+              0.8,
+              1.2
+            ]
+          }
+        },
+        "contrast": {
+          "weight": 1.0,
+          "type": "ColorJitter",
+          "kwargs": {
+            "contrast": [
+              0.8,
+              1.2
+            ]
+          }
+        },
+        "saturation": {
+          "weight": 1.0,
+          "type": "ColorJitter",
+          "kwargs": {
+            "saturation": [
+              0.5,
+              1.5
+            ]
+          }
+        },
+        "hue": {
+          "weight": 1.0,
+          "type": "ColorJitter",
+          "kwargs": {
+            "hue": [
+              -0.05,
+              0.05
+            ]
+          }
+        },
+        "sharpness": {
+          "weight": 1.0,
+          "type": "SharpnessJitter",
+          "kwargs": {
+            "sharpness": [
+              0.5,
+              1.5
+            ]
+          }
+        },
+        "affine": {
+          "weight": 1.0,
+          "type": "RandomAffine",
+          "kwargs": {
+            "degrees": [
+              -5.0,
+              5.0
+            ],
+            "translate": [
+              0.05,
+              0.05
+            ]
+          }
+        }
+      }
+    },
+    "wrist_transforms": {
+      "enable": true,
+      "max_num_transforms": 3,
+      "random_order": false,
+      "tfs": {
+        "brightness": {
+          "weight": 1.0,
+          "type": "ColorJitter",
+          "kwargs": {
+            "brightness": [
+              0.8,
+              1.2
+            ]
+          }
+        },
+        "contrast": {
+          "weight": 1.0,
+          "type": "ColorJitter",
+          "kwargs": {
+            "contrast": [
+              0.8,
+              1.2
+            ]
+          }
+        },
+        "saturation": {
+          "weight": 1.0,
+          "type": "ColorJitter",
+          "kwargs": {
+            "saturation": [
+              0.5,
+              1.5
+            ]
+          }
+        },
+        "hue": {
+          "weight": 1.0,
+          "type": "ColorJitter",
+          "kwargs": {
+            "hue": [
+              -0.05,
+              0.05
+            ]
+          }
+        },
+        "sharpness": {
+          "weight": 1.0,
+          "type": "SharpnessJitter",
+          "kwargs": {
+            "sharpness": [
+              0.5,
+              1.5
+            ]
+          }
+        }
+      }
+    },
+    "revision": "v2.0",
+    "use_imagenet_stats": true,
+    "video_backend": "torchcodec",
+    "streaming": false
+  },
+  "env": null,
+  "policy": {
+    "type": "vista",
+    "n_obs_steps": 1,
+    "input_features": {
+      "observation.state": {
+        "type": "STATE",
+        "shape": [
+          16
+        ]
+      },
+      "observation.images.left_wrist": {
+        "type": "VISUAL",
+        "shape": [
+          3,
+          224,
+          224
+        ]
+      },
+      "observation.images.right_wrist": {
+        "type": "VISUAL",
+        "shape": [
+          3,
+          224,
+          224
+        ]
+      }
+    },
+    "output_features": {
+      "action": {
+        "type": "ACTION",
+        "shape": [
+          16
+        ]
+      }
+    },
+    "device": "cuda",
+    "use_amp": false,
+    "use_delta_action": true,
+    "push_to_hub": false,
+    "repo_id": null,
+    "private": null,
+    "tags": null,
+    "license": null,
+    "pretrained_path": "/data/ysy/data/models/umi_0312_40w",
+    "paligemma_variant": "gemma_2b",
+    "action_expert_variant": "gemma_300m",
+    "dtype": "bfloat16",
+    "chunk_size": 50,
+    "n_action_steps": 50,
+    "max_state_dim": 32,
+    "max_action_dim": 32,
+    "num_inference_steps": 10,
+    "time_sampling_beta_alpha": 1.5,
+    "time_sampling_beta_beta": 1.0,
+    "time_sampling_scale": 0.999,
+    "time_sampling_offset": 0.001,
+    "min_period": 0.004,
+    "max_period": 4.0,
+    "image_resolution": [
+      224,
+      224
+    ],
+    "empty_cameras": 0,
+    "tokenizer_max_length": 200,
+    "normalization_mapping": {
+      "VISUAL": "IDENTITY",
+      "STATE": "QUANTILES",
+      "ACTION": "QUANTILES"
+    },
+    "gradient_checkpointing": false,
+    "compile_model": false,
+    "compile_mode": "max-autotune",
+    "optimizer_lr": 2.5e-05,
+    "optimizer_betas": [
+      0.9,
+      0.95
+    ],
+    "optimizer_eps": 1e-08,
+    "optimizer_weight_decay": 0.01,
+    "optimizer_grad_clip_norm": 1.0,
+    "scheduler_warmup_steps": 1000,
+    "scheduler_decay_steps": 300000,
+    "scheduler_decay_lr": 2.5e-06
+  },
+  "output_dir": "/data/ysy/data/train_output/pre_s2/lerobot_pretrain_used/26-04-23_04-23-37_pi05_gpu8_ck50_lr2_5e-5_bs24_s300K_seed42",
+  "job_name": "vista",
+  "resume": false,
+  "seed": 42,
+  "num_workers": 8,
+  "batch_size": 24,
+  "steps": 300000,
+  "eval_freq": 5000,
+  "log_freq": 50,
+  "save_checkpoint": true,
+  "save_freq": 20000,
+  "use_policy_training_preset": true,
+  "optimizer": {
+    "type": "adamw",
+    "lr": 2.5e-05,
+    "weight_decay": 0.01,
+    "grad_clip_norm": 1.0,
+    "betas": [
+      0.9,
+      0.95
+    ],
+    "eps": 1e-08
+  },
+  "scheduler": {
+    "type": "cosine_decay_with_warmup",
+    "num_warmup_steps": 1000,
+    "num_decay_steps": 300000,
+    "peak_lr": 2.5e-05,
+    "decay_lr": 2.5e-06
+  },
+  "eval": {
+    "n_episodes": 50,
+    "batch_size": 50,
+    "use_async_envs": false
+  },
+  "wandb": {
+    "enable": false,
+    "disable_artifact": false,
+    "project": "lerobot",
+    "entity": null,
+    "notes": null,
+    "run_id": null,
+    "mode": null
+  },
+  "checkpoint_path": null,
+  "rename_map": {},
+  "accelerator_logging_dir": "accelerate_logs",
+  "mixed_precision": "bf16",
+  "enforce_input_output_replace": true,
+  "gradient_checkpointing": false,
+  "save_as_safetensors": true,
+  "load_from_safetensors": true
+}