lvwerra HF staff committed on
Commit
599cb93
·
1 Parent(s): ac3398e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -4
app.py CHANGED
@@ -252,14 +252,13 @@ css += share_btn_css + monospace_css + ".gradio-container {color: black}"
252
 
253
  description = """
254
  <div style="text-align: center;">
255
- <h1> TRL + TextEnvironment </h1>
256
- <h2> Teaching Language Models to use tools. </h2>
257
  </div>
258
  <div style="text-align: left;">
259
  <p>This is a demo to generate text and code with the following StarCoderBase models:</p>
260
  <ul>
261
- <li><a href="https://huggingface.co/vwxyzjn/starcoderbase-triviaqa" style='color: #e6b800;'>StarCoderBase TriviaQA</a>: A finetuned version of StarCoderBase on on the TriviaQA dataset using reinforcement learning via [TRL's TextEnvironment](https://github.com/huggingface/trl/pull/424)</li>
262
- <li><a href="https://huggingface.co/lvwerra/starcoderbase-gsm8k" style='color: #e6b800;'>StarCoderBase GSM8K</a>: A finetuned version of StarCoderBase on on the GSM8K dataset using reinforcement learning via TRL's [TextEnvironment](https://github.com/huggingface/trl/pull/424).</li>
263
  </ul>
264
  </div>
265
  """
 
252
 
253
  description = """
254
  <div style="text-align: center;">
255
+ <img src="https://huggingface.co/datasets/trl-internal-testing/example-images/resolve/main/images/textenv_demo_banner.png">
 
256
  </div>
257
  <div style="text-align: left;">
258
  <p>This is a demo to generate text and code with the following StarCoderBase models:</p>
259
  <ul>
260
+ <li><a href="https://huggingface.co/vwxyzjn/starcoderbase-triviaqa">StarCoderBase TriviaQA</a>: A finetuned version of StarCoderBase on the TriviaQA dataset using reinforcement learning via <a href="https://github.com/huggingface/trl/pull/424">TRL's TextEnvironment</a>.</li>
261
+ <li><a href="https://huggingface.co/lvwerra/starcoderbase-gsm8k">StarCoderBase GSM8K</a>: A finetuned version of StarCoderBase on the GSM8K dataset using reinforcement learning via <a href="https://github.com/huggingface/trl/pull/424">TRL's TextEnvironment</a>.</li>
262
  </ul>
263
  </div>
264
  """