Update README.md
Browse files — adding TRL citation
README.md
CHANGED
@@ -42,4 +42,16 @@ Please convert the following legal content into a short human-readable summary<|
|
|
42 |
|
43 |
inputs = tokenizer(prompt, return_tensors="pt").to("cuda")
|
44 |
outputs = model.generate(**inputs, max_new_tokens=128)
|
45 |
-
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
42 |
|
43 |
inputs = tokenizer(prompt, return_tensors="pt").to("cuda")
|
44 |
outputs = model.generate(**inputs, max_new_tokens=128)
|
45 |
+
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
|
46 |
+
|
47 |
+
## 📚 Citations
|
48 |
+
|
49 |
+
```bibtex
|
50 |
+
@misc{vonwerra2022trl,
|
51 |
+
title = {{TRL: Transformer Reinforcement Learning}},
|
52 |
+
author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallou{\'e}dec},
|
53 |
+
year = 2020,
|
54 |
+
journal = {GitHub repository},
|
55 |
+
publisher = {GitHub},
|
56 |
+
howpublished = {\url{https://github.com/huggingface/trl}}
|
57 |
+
}
|