---
license: apache-2.0
library_name: transformers
tags:
- trl
- ppo
- transformers
- reinforcement-learning
---

To use:

```python
from transformers import AutoTokenizer, LlamaForCausalLM
model = LlamaForCausalLM.from_pretrained("hug-me-please/RL_CAMEL")
tokenizer = AutoTokenizer.from_pretrained("hug-me-please/RL_CAMEL")
```