-
Notifications
You must be signed in to change notification settings - Fork 4
/
fg-rlhf.yml
81 lines (74 loc) 路 2.57 KB
/
fg-rlhf.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
template_name: fg-rlhf
template_label: Wu et al., 2023
template_description: Fine-grained human feedback typology introduced by Wu et al., 2023 for RLHF
# ========================================================================================
#
# This typology is used as part of a RLHF pipeline for fine-tuning a LLM as a QA system.
# The original interface had annotators select missing info at the bottom of the interface
# instead of selecting the relevant span in the passage. See Figures 5 & 6 in App. C of
# Wu et al., 2023 for details.
#
# ========================================================================================
interface_text:
typology:
context_label: ""
source_label: "Reference Answer"
target_label: "Generation"
font_size:
source: 16
target: 16
edits:
- name: factual
label: "Factual Error"
enable_output: true
color: red
icon: fa-x
annotation:
- name: factual_error
question: "Select the factual/language error."
options:
- name: irrelevant
label: "Irrelevant"
- name: repetitive
label: "Repetitive"
- name: inconsistent
label: "Inconsistent"
- name: unverifiable
label: "Unverifiable Fact"
- name: incoherent
label: "Incoherent"
- name: explanation
label: "Explanation"
question: "Explain your selection."
options: textarea
required: false
- name: missing_info
label: "Missing Info"
icon: fa-question
color: blue
annotation:
- name: missing_info_error
question: "Select the missing info error."
options:
- name: missing_answer
label: "Missing Answer"
- name: missing_major_auxiliary
label: "Missing Major Auxiliary Info"
- name: missing_minor_auxiliary
label: "Missing Minor Auxiliary Info"
- name: passage_id
label: "Passage"
question: "In which passage does this occur?"
options: textbox
- name: sentence_id
label: "Sentence"
question: "In which sentence contains the missing info?"
options: textbox
paper_link: https://arxiv.org/abs/2306.01693
citation: |
@article{wu2023fine,
title={Fine-Grained Human Feedback Gives Better Rewards for Language Model Training},
author={Wu, Zeqiu and Hu, Yushi and Shi, Weijia and Dziri, Nouha and Suhr, Alane and Ammanabrolu, Prithviraj and Smith, Noah A and Ostendorf, Mari and Hajishirzi, Hannaneh},
journal={arXiv preprint arXiv:2306.01693},
year={2023}
}