Upload policy weights, train config and readme
Browse files- README.md +63 -0
- config.json +96 -0
- model.safetensors +3 -0
- train_config.json +208 -0
    	
        README.md
    ADDED
    
    | @@ -0,0 +1,63 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            ---
         | 
| 2 | 
            +
            base_model: lerobot/smolvla_base
         | 
| 3 | 
            +
            datasets: eliasab16/grab_and_insert_with_recovery_method_1
         | 
| 4 | 
            +
            library_name: lerobot
         | 
| 5 | 
            +
            license: apache-2.0
         | 
| 6 | 
            +
            model_name: smolvla
         | 
| 7 | 
            +
            pipeline_tag: robotics
         | 
| 8 | 
            +
            tags:
         | 
| 9 | 
            +
            - smolvla
         | 
| 10 | 
            +
            - robotics
         | 
| 11 | 
            +
            - lerobot
         | 
| 12 | 
            +
            ---
         | 
| 13 | 
            +
             | 
| 14 | 
            +
            # Model Card for smolvla
         | 
| 15 | 
            +
             | 
| 16 | 
            +
            <!-- Provide a quick summary of what the model is/does. -->
         | 
| 17 | 
            +
             | 
| 18 | 
            +
             | 
| 19 | 
            +
            [SmolVLA](https://huggingface.co/papers/2506.01844) is a compact, efficient vision-language-action model that achieves competitive performance at reduced computational costs and can be deployed on consumer-grade hardware.
         | 
| 20 | 
            +
             | 
| 21 | 
            +
             | 
| 22 | 
            +
            This policy has been trained and pushed to the Hub using [LeRobot](https://github.com/huggingface/lerobot).
         | 
| 23 | 
            +
            See the full documentation at [LeRobot Docs](https://huggingface.co/docs/lerobot/index).
         | 
| 24 | 
            +
             | 
| 25 | 
            +
            ---
         | 
| 26 | 
            +
             | 
| 27 | 
            +
            ## How to Get Started with the Model
         | 
| 28 | 
            +
             | 
| 29 | 
            +
            For a complete walkthrough, see the [training guide](https://huggingface.co/docs/lerobot/il_robots#train-a-policy).
         | 
| 30 | 
            +
            Below is the short version on how to train and run inference/eval:
         | 
| 31 | 
            +
             | 
| 32 | 
            +
            ### Train from scratch
         | 
| 33 | 
            +
             | 
| 34 | 
            +
            ```bash
         | 
| 35 | 
            +
            lerobot-train \
         | 
| 36 | 
            +
              --dataset.repo_id=${HF_USER}/<dataset> \
         | 
| 37 | 
            +
              --policy.type=act \
         | 
| 38 | 
            +
              --output_dir=outputs/train/<desired_policy_repo_id> \
         | 
| 39 | 
            +
              --job_name=lerobot_training \
         | 
| 40 | 
            +
              --policy.device=cuda \
         | 
| 41 | 
            +
              --policy.repo_id=${HF_USER}/<desired_policy_repo_id>
         | 
| 42 | 
            +
              --wandb.enable=true
         | 
| 43 | 
            +
            ```
         | 
| 44 | 
            +
             | 
| 45 | 
            +
            _Writes checkpoints to `outputs/train/<desired_policy_repo_id>/checkpoints/`._
         | 
| 46 | 
            +
             | 
| 47 | 
            +
            ### Evaluate the policy/run inference
         | 
| 48 | 
            +
             | 
| 49 | 
            +
            ```bash
         | 
| 50 | 
            +
            lerobot-record \
         | 
| 51 | 
            +
              --robot.type=so100_follower \
         | 
| 52 | 
            +
              --dataset.repo_id=<hf_user>/eval_<dataset> \
         | 
| 53 | 
            +
              --policy.path=<hf_user>/<desired_policy_repo_id> \
         | 
| 54 | 
            +
              --episodes=10
         | 
| 55 | 
            +
            ```
         | 
| 56 | 
            +
             | 
| 57 | 
            +
            Prefix the dataset repo with **eval\_** and supply `--policy.path` pointing to a local or hub checkpoint.
         | 
| 58 | 
            +
             | 
| 59 | 
            +
            ---
         | 
| 60 | 
            +
             | 
| 61 | 
            +
            ## Model Details
         | 
| 62 | 
            +
             | 
| 63 | 
            +
            - **License:** apache-2.0
         | 
    	
        config.json
    ADDED
    
    | @@ -0,0 +1,96 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
                "type": "smolvla",
         | 
| 3 | 
            +
                "n_obs_steps": 1,
         | 
| 4 | 
            +
                "normalization_mapping": {
         | 
| 5 | 
            +
                    "VISUAL": "IDENTITY",
         | 
| 6 | 
            +
                    "STATE": "MEAN_STD",
         | 
| 7 | 
            +
                    "ACTION": "MEAN_STD"
         | 
| 8 | 
            +
                },
         | 
| 9 | 
            +
                "input_features": {
         | 
| 10 | 
            +
                    "observation.state": {
         | 
| 11 | 
            +
                        "type": "STATE",
         | 
| 12 | 
            +
                        "shape": [
         | 
| 13 | 
            +
                            6
         | 
| 14 | 
            +
                        ]
         | 
| 15 | 
            +
                    },
         | 
| 16 | 
            +
                    "observation.images.top_cam": {
         | 
| 17 | 
            +
                        "type": "VISUAL",
         | 
| 18 | 
            +
                        "shape": [
         | 
| 19 | 
            +
                            3,
         | 
| 20 | 
            +
                            600,
         | 
| 21 | 
            +
                            800
         | 
| 22 | 
            +
                        ]
         | 
| 23 | 
            +
                    },
         | 
| 24 | 
            +
                    "observation.images.wrist_bottom_cam": {
         | 
| 25 | 
            +
                        "type": "VISUAL",
         | 
| 26 | 
            +
                        "shape": [
         | 
| 27 | 
            +
                            3,
         | 
| 28 | 
            +
                            600,
         | 
| 29 | 
            +
                            800
         | 
| 30 | 
            +
                        ]
         | 
| 31 | 
            +
                    },
         | 
| 32 | 
            +
                    "observation.images.wrist_top_cam": {
         | 
| 33 | 
            +
                        "type": "VISUAL",
         | 
| 34 | 
            +
                        "shape": [
         | 
| 35 | 
            +
                            3,
         | 
| 36 | 
            +
                            600,
         | 
| 37 | 
            +
                            800
         | 
| 38 | 
            +
                        ]
         | 
| 39 | 
            +
                    }
         | 
| 40 | 
            +
                },
         | 
| 41 | 
            +
                "output_features": {
         | 
| 42 | 
            +
                    "action": {
         | 
| 43 | 
            +
                        "type": "ACTION",
         | 
| 44 | 
            +
                        "shape": [
         | 
| 45 | 
            +
                            6
         | 
| 46 | 
            +
                        ]
         | 
| 47 | 
            +
                    }
         | 
| 48 | 
            +
                },
         | 
| 49 | 
            +
                "device": "cuda",
         | 
| 50 | 
            +
                "use_amp": false,
         | 
| 51 | 
            +
                "push_to_hub": true,
         | 
| 52 | 
            +
                "repo_id": "eliasab16/grab_and_insert_with_recovery_method_1_25k",
         | 
| 53 | 
            +
                "private": null,
         | 
| 54 | 
            +
                "tags": null,
         | 
| 55 | 
            +
                "license": null,
         | 
| 56 | 
            +
                "chunk_size": 50,
         | 
| 57 | 
            +
                "n_action_steps": 50,
         | 
| 58 | 
            +
                "max_state_dim": 32,
         | 
| 59 | 
            +
                "max_action_dim": 32,
         | 
| 60 | 
            +
                "resize_imgs_with_padding": [
         | 
| 61 | 
            +
                    512,
         | 
| 62 | 
            +
                    512
         | 
| 63 | 
            +
                ],
         | 
| 64 | 
            +
                "empty_cameras": 0,
         | 
| 65 | 
            +
                "adapt_to_pi_aloha": false,
         | 
| 66 | 
            +
                "use_delta_joint_actions_aloha": false,
         | 
| 67 | 
            +
                "tokenizer_max_length": 48,
         | 
| 68 | 
            +
                "num_steps": 10,
         | 
| 69 | 
            +
                "use_cache": true,
         | 
| 70 | 
            +
                "freeze_vision_encoder": true,
         | 
| 71 | 
            +
                "train_expert_only": true,
         | 
| 72 | 
            +
                "train_state_proj": true,
         | 
| 73 | 
            +
                "optimizer_lr": 0.0001,
         | 
| 74 | 
            +
                "optimizer_betas": [
         | 
| 75 | 
            +
                    0.9,
         | 
| 76 | 
            +
                    0.95
         | 
| 77 | 
            +
                ],
         | 
| 78 | 
            +
                "optimizer_eps": 1e-08,
         | 
| 79 | 
            +
                "optimizer_weight_decay": 1e-10,
         | 
| 80 | 
            +
                "optimizer_grad_clip_norm": 10.0,
         | 
| 81 | 
            +
                "scheduler_warmup_steps": 1000,
         | 
| 82 | 
            +
                "scheduler_decay_steps": 30000,
         | 
| 83 | 
            +
                "scheduler_decay_lr": 2.5e-06,
         | 
| 84 | 
            +
                "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
         | 
| 85 | 
            +
                "load_vlm_weights": true,
         | 
| 86 | 
            +
                "add_image_special_tokens": false,
         | 
| 87 | 
            +
                "attention_mode": "cross_attn",
         | 
| 88 | 
            +
                "prefix_length": 0,
         | 
| 89 | 
            +
                "pad_language_to": "max_length",
         | 
| 90 | 
            +
                "num_expert_layers": 0,
         | 
| 91 | 
            +
                "num_vlm_layers": 16,
         | 
| 92 | 
            +
                "self_attn_every_n_layers": 2,
         | 
| 93 | 
            +
                "expert_width_multiplier": 0.75,
         | 
| 94 | 
            +
                "min_period": 0.004,
         | 
| 95 | 
            +
                "max_period": 4.0
         | 
| 96 | 
            +
            }
         | 
    	
        model.safetensors
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:6e17b4afdfc5462d69f79c1a6c030944d0f8f790ad7628a6752fd028861fcd2e
         | 
| 3 | 
            +
            size 906713296
         | 
    	
        train_config.json
    ADDED
    
    | @@ -0,0 +1,208 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
                "dataset": {
         | 
| 3 | 
            +
                    "repo_id": "eliasab16/grab_and_insert_with_recovery_method_1",
         | 
| 4 | 
            +
                    "root": null,
         | 
| 5 | 
            +
                    "episodes": null,
         | 
| 6 | 
            +
                    "image_transforms": {
         | 
| 7 | 
            +
                        "enable": false,
         | 
| 8 | 
            +
                        "max_num_transforms": 3,
         | 
| 9 | 
            +
                        "random_order": false,
         | 
| 10 | 
            +
                        "tfs": {
         | 
| 11 | 
            +
                            "brightness": {
         | 
| 12 | 
            +
                                "weight": 1.0,
         | 
| 13 | 
            +
                                "type": "ColorJitter",
         | 
| 14 | 
            +
                                "kwargs": {
         | 
| 15 | 
            +
                                    "brightness": [
         | 
| 16 | 
            +
                                        0.8,
         | 
| 17 | 
            +
                                        1.2
         | 
| 18 | 
            +
                                    ]
         | 
| 19 | 
            +
                                }
         | 
| 20 | 
            +
                            },
         | 
| 21 | 
            +
                            "contrast": {
         | 
| 22 | 
            +
                                "weight": 1.0,
         | 
| 23 | 
            +
                                "type": "ColorJitter",
         | 
| 24 | 
            +
                                "kwargs": {
         | 
| 25 | 
            +
                                    "contrast": [
         | 
| 26 | 
            +
                                        0.8,
         | 
| 27 | 
            +
                                        1.2
         | 
| 28 | 
            +
                                    ]
         | 
| 29 | 
            +
                                }
         | 
| 30 | 
            +
                            },
         | 
| 31 | 
            +
                            "saturation": {
         | 
| 32 | 
            +
                                "weight": 1.0,
         | 
| 33 | 
            +
                                "type": "ColorJitter",
         | 
| 34 | 
            +
                                "kwargs": {
         | 
| 35 | 
            +
                                    "saturation": [
         | 
| 36 | 
            +
                                        0.5,
         | 
| 37 | 
            +
                                        1.5
         | 
| 38 | 
            +
                                    ]
         | 
| 39 | 
            +
                                }
         | 
| 40 | 
            +
                            },
         | 
| 41 | 
            +
                            "hue": {
         | 
| 42 | 
            +
                                "weight": 1.0,
         | 
| 43 | 
            +
                                "type": "ColorJitter",
         | 
| 44 | 
            +
                                "kwargs": {
         | 
| 45 | 
            +
                                    "hue": [
         | 
| 46 | 
            +
                                        -0.05,
         | 
| 47 | 
            +
                                        0.05
         | 
| 48 | 
            +
                                    ]
         | 
| 49 | 
            +
                                }
         | 
| 50 | 
            +
                            },
         | 
| 51 | 
            +
                            "sharpness": {
         | 
| 52 | 
            +
                                "weight": 1.0,
         | 
| 53 | 
            +
                                "type": "SharpnessJitter",
         | 
| 54 | 
            +
                                "kwargs": {
         | 
| 55 | 
            +
                                    "sharpness": [
         | 
| 56 | 
            +
                                        0.5,
         | 
| 57 | 
            +
                                        1.5
         | 
| 58 | 
            +
                                    ]
         | 
| 59 | 
            +
                                }
         | 
| 60 | 
            +
                            }
         | 
| 61 | 
            +
                        }
         | 
| 62 | 
            +
                    },
         | 
| 63 | 
            +
                    "revision": null,
         | 
| 64 | 
            +
                    "use_imagenet_stats": true,
         | 
| 65 | 
            +
                    "video_backend": "torchcodec"
         | 
| 66 | 
            +
                },
         | 
| 67 | 
            +
                "env": null,
         | 
| 68 | 
            +
                "policy": {
         | 
| 69 | 
            +
                    "type": "smolvla",
         | 
| 70 | 
            +
                    "n_obs_steps": 1,
         | 
| 71 | 
            +
                    "normalization_mapping": {
         | 
| 72 | 
            +
                        "VISUAL": "IDENTITY",
         | 
| 73 | 
            +
                        "STATE": "MEAN_STD",
         | 
| 74 | 
            +
                        "ACTION": "MEAN_STD"
         | 
| 75 | 
            +
                    },
         | 
| 76 | 
            +
                    "input_features": {
         | 
| 77 | 
            +
                        "observation.state": {
         | 
| 78 | 
            +
                            "type": "STATE",
         | 
| 79 | 
            +
                            "shape": [
         | 
| 80 | 
            +
                                6
         | 
| 81 | 
            +
                            ]
         | 
| 82 | 
            +
                        },
         | 
| 83 | 
            +
                        "observation.images.top_cam": {
         | 
| 84 | 
            +
                            "type": "VISUAL",
         | 
| 85 | 
            +
                            "shape": [
         | 
| 86 | 
            +
                                3,
         | 
| 87 | 
            +
                                600,
         | 
| 88 | 
            +
                                800
         | 
| 89 | 
            +
                            ]
         | 
| 90 | 
            +
                        },
         | 
| 91 | 
            +
                        "observation.images.wrist_bottom_cam": {
         | 
| 92 | 
            +
                            "type": "VISUAL",
         | 
| 93 | 
            +
                            "shape": [
         | 
| 94 | 
            +
                                3,
         | 
| 95 | 
            +
                                600,
         | 
| 96 | 
            +
                                800
         | 
| 97 | 
            +
                            ]
         | 
| 98 | 
            +
                        },
         | 
| 99 | 
            +
                        "observation.images.wrist_top_cam": {
         | 
| 100 | 
            +
                            "type": "VISUAL",
         | 
| 101 | 
            +
                            "shape": [
         | 
| 102 | 
            +
                                3,
         | 
| 103 | 
            +
                                600,
         | 
| 104 | 
            +
                                800
         | 
| 105 | 
            +
                            ]
         | 
| 106 | 
            +
                        }
         | 
| 107 | 
            +
                    },
         | 
| 108 | 
            +
                    "output_features": {
         | 
| 109 | 
            +
                        "action": {
         | 
| 110 | 
            +
                            "type": "ACTION",
         | 
| 111 | 
            +
                            "shape": [
         | 
| 112 | 
            +
                                6
         | 
| 113 | 
            +
                            ]
         | 
| 114 | 
            +
                        }
         | 
| 115 | 
            +
                    },
         | 
| 116 | 
            +
                    "device": "cuda",
         | 
| 117 | 
            +
                    "use_amp": false,
         | 
| 118 | 
            +
                    "push_to_hub": true,
         | 
| 119 | 
            +
                    "repo_id": "eliasab16/grab_and_insert_with_recovery_method_1_25k",
         | 
| 120 | 
            +
                    "private": null,
         | 
| 121 | 
            +
                    "tags": null,
         | 
| 122 | 
            +
                    "license": null,
         | 
| 123 | 
            +
                    "chunk_size": 50,
         | 
| 124 | 
            +
                    "n_action_steps": 50,
         | 
| 125 | 
            +
                    "max_state_dim": 32,
         | 
| 126 | 
            +
                    "max_action_dim": 32,
         | 
| 127 | 
            +
                    "resize_imgs_with_padding": [
         | 
| 128 | 
            +
                        512,
         | 
| 129 | 
            +
                        512
         | 
| 130 | 
            +
                    ],
         | 
| 131 | 
            +
                    "empty_cameras": 0,
         | 
| 132 | 
            +
                    "adapt_to_pi_aloha": false,
         | 
| 133 | 
            +
                    "use_delta_joint_actions_aloha": false,
         | 
| 134 | 
            +
                    "tokenizer_max_length": 48,
         | 
| 135 | 
            +
                    "num_steps": 10,
         | 
| 136 | 
            +
                    "use_cache": true,
         | 
| 137 | 
            +
                    "freeze_vision_encoder": true,
         | 
| 138 | 
            +
                    "train_expert_only": true,
         | 
| 139 | 
            +
                    "train_state_proj": true,
         | 
| 140 | 
            +
                    "optimizer_lr": 0.0001,
         | 
| 141 | 
            +
                    "optimizer_betas": [
         | 
| 142 | 
            +
                        0.9,
         | 
| 143 | 
            +
                        0.95
         | 
| 144 | 
            +
                    ],
         | 
| 145 | 
            +
                    "optimizer_eps": 1e-08,
         | 
| 146 | 
            +
                    "optimizer_weight_decay": 1e-10,
         | 
| 147 | 
            +
                    "optimizer_grad_clip_norm": 10.0,
         | 
| 148 | 
            +
                    "scheduler_warmup_steps": 1000,
         | 
| 149 | 
            +
                    "scheduler_decay_steps": 30000,
         | 
| 150 | 
            +
                    "scheduler_decay_lr": 2.5e-06,
         | 
| 151 | 
            +
                    "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
         | 
| 152 | 
            +
                    "load_vlm_weights": true,
         | 
| 153 | 
            +
                    "add_image_special_tokens": false,
         | 
| 154 | 
            +
                    "attention_mode": "cross_attn",
         | 
| 155 | 
            +
                    "prefix_length": 0,
         | 
| 156 | 
            +
                    "pad_language_to": "max_length",
         | 
| 157 | 
            +
                    "num_expert_layers": 0,
         | 
| 158 | 
            +
                    "num_vlm_layers": 16,
         | 
| 159 | 
            +
                    "self_attn_every_n_layers": 2,
         | 
| 160 | 
            +
                    "expert_width_multiplier": 0.75,
         | 
| 161 | 
            +
                    "min_period": 0.004,
         | 
| 162 | 
            +
                    "max_period": 4.0
         | 
| 163 | 
            +
                },
         | 
| 164 | 
            +
                "output_dir": "outputs/train",
         | 
| 165 | 
            +
                "job_name": "grab_and_insert_with_recovery_method_1",
         | 
| 166 | 
            +
                "resume": false,
         | 
| 167 | 
            +
                "seed": 1000,
         | 
| 168 | 
            +
                "num_workers": 4,
         | 
| 169 | 
            +
                "batch_size": 64,
         | 
| 170 | 
            +
                "steps": 25000,
         | 
| 171 | 
            +
                "eval_freq": 20000,
         | 
| 172 | 
            +
                "log_freq": 200,
         | 
| 173 | 
            +
                "save_checkpoint": true,
         | 
| 174 | 
            +
                "save_freq": 10000,
         | 
| 175 | 
            +
                "use_policy_training_preset": true,
         | 
| 176 | 
            +
                "optimizer": {
         | 
| 177 | 
            +
                    "type": "adamw",
         | 
| 178 | 
            +
                    "lr": 0.0001,
         | 
| 179 | 
            +
                    "weight_decay": 1e-10,
         | 
| 180 | 
            +
                    "grad_clip_norm": 10.0,
         | 
| 181 | 
            +
                    "betas": [
         | 
| 182 | 
            +
                        0.9,
         | 
| 183 | 
            +
                        0.95
         | 
| 184 | 
            +
                    ],
         | 
| 185 | 
            +
                    "eps": 1e-08
         | 
| 186 | 
            +
                },
         | 
| 187 | 
            +
                "scheduler": {
         | 
| 188 | 
            +
                    "type": "cosine_decay_with_warmup",
         | 
| 189 | 
            +
                    "num_warmup_steps": 1000,
         | 
| 190 | 
            +
                    "num_decay_steps": 30000,
         | 
| 191 | 
            +
                    "peak_lr": 0.0001,
         | 
| 192 | 
            +
                    "decay_lr": 2.5e-06
         | 
| 193 | 
            +
                },
         | 
| 194 | 
            +
                "eval": {
         | 
| 195 | 
            +
                    "n_episodes": 50,
         | 
| 196 | 
            +
                    "batch_size": 50,
         | 
| 197 | 
            +
                    "use_async_envs": false
         | 
| 198 | 
            +
                },
         | 
| 199 | 
            +
                "wandb": {
         | 
| 200 | 
            +
                    "enable": true,
         | 
| 201 | 
            +
                    "disable_artifact": false,
         | 
| 202 | 
            +
                    "project": "lerobot",
         | 
| 203 | 
            +
                    "entity": null,
         | 
| 204 | 
            +
                    "notes": null,
         | 
| 205 | 
            +
                    "run_id": "3tv3o8c5",
         | 
| 206 | 
            +
                    "mode": null
         | 
| 207 | 
            +
                }
         | 
| 208 | 
            +
            }
         |