mirror of
https://github.com/huggingface/lerobot.git
synced 2026-05-20 11:09:59 +00:00
Update reward classifier training config (#3147)
Co-authored-by: Khalil Meftah <khalil.meftah@huggingface.co>
This commit is contained in:
+26
-2
@@ -685,6 +685,10 @@ Example configuration for training the [reward classifier](https://huggingface.c
|
|||||||
|
|
||||||
```json
|
```json
|
||||||
{
|
{
|
||||||
|
"dataset": {
|
||||||
|
"repo_id": "hf_username/dataset_name",
|
||||||
|
"root": null
|
||||||
|
},
|
||||||
"policy": {
|
"policy": {
|
||||||
"type": "reward_classifier",
|
"type": "reward_classifier",
|
||||||
"model_name": "helper2424/resnet10",
|
"model_name": "helper2424/resnet10",
|
||||||
@@ -705,8 +709,28 @@ Example configuration for training the [reward classifier](https://huggingface.c
|
|||||||
"type": "VISUAL",
|
"type": "VISUAL",
|
||||||
"shape": [3, 128, 128]
|
"shape": [3, 128, 128]
|
||||||
}
|
}
|
||||||
}
|
},
|
||||||
}
|
"push_to_hub": true,
|
||||||
|
"repo_id": "hf_username/model_repo"
|
||||||
|
},
|
||||||
|
"batch_size": 16,
|
||||||
|
"num_workers": 4,
|
||||||
|
"steps": 5000,
|
||||||
|
"log_freq": 10,
|
||||||
|
"eval_freq": 1000,
|
||||||
|
"save_freq": 1000,
|
||||||
|
"save_checkpoint": true,
|
||||||
|
"seed": 2,
|
||||||
|
"resume": false,
|
||||||
|
"optimizer": {
|
||||||
|
"grad_clip_norm": 10.0
|
||||||
|
},
|
||||||
|
"wandb": {
|
||||||
|
"enable": true,
|
||||||
|
"project": "reward-classifier",
|
||||||
|
"disable_artifact": false
|
||||||
|
},
|
||||||
|
"job_name": "reward-classifier"
|
||||||
}
|
}
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user