Text Classification
Transformers
PyTorch
English
electra
reward-model
reward_model
RLHF
Inference Endpoints
Files changed (1) hide show
  1. README.md +17 -0
README.md CHANGED
@@ -4,14 +4,31 @@ datasets:
4
  - openai/webgpt_comparisons
5
  - openai/summarize_from_feedback
6
  - Dahoas/instruct-synthetic-prompt-responses
 
 
 
 
7
  language:
8
  - en
 
 
 
 
 
9
  metrics:
10
  - accuracy
 
11
  tags:
12
  - reward-model
13
  - reward_model
14
  - RLHF
 
 
 
 
 
 
 
15
  ---
16
  # Reward model trained from human feedback
17
 
 
4
  - openai/webgpt_comparisons
5
  - openai/summarize_from_feedback
6
  - Dahoas/instruct-synthetic-prompt-responses
7
+ - Open-Orca/OpenOrca
8
+ - OpenAssistant/oasst1
9
+ - openchat/openchat_sharegpt4_dataset
10
+ - fka/awesome-chatgpt-prompts
11
  language:
12
  - en
13
+ - es
14
+ - kr
15
+ - lo
16
+ - ko
17
+ - ja
18
  metrics:
19
  - accuracy
20
+ - character
21
  tags:
22
  - reward-model
23
  - reward_model
24
  - RLHF
25
+ - art
26
+ - code
27
+ - finance
28
+ - chemistry
29
+ - biology
30
+ library_name: transformers
31
+ pipeline_tag: text-classification
32
  ---
33
  # Reward model trained from human feedback
34