Spaces:
Sleeping
Sleeping
Commit
·
12d4c5a
1
Parent(s):
097d2a9
update instruction
Browse files
- eval_round_r1.db +3 -0
- src/eval_server.py +1 -14
- src/instuction_md.py +2 -1
eval_round_r1.db
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1a533d4d5865529ddc5a733df7afb48b05c4704ead3df9f35cf1169e3807610
|
| 3 |
+
size 65536
|
src/eval_server.py
CHANGED
|
@@ -151,20 +151,7 @@ def app_main(args) -> None:
|
|
| 151 |
|
| 152 |
# Collapsible task guide
|
| 153 |
with gr.Accordion('Task Instructions (Click to expand)', open=False):
|
| 154 |
-
gr.Markdown(
|
| 155 |
-
'## Question 1: Relevance Score (1-5)\n'
|
| 156 |
-
'Rate how relevant the icon is to the given label on a scale of 1 to 5:\n'
|
| 157 |
-
'- **5**: Strongly related (highly consistent with the label, clear match)\n'
|
| 158 |
-
'- **4**: Moderately related (clear partial connection, overall closer to related)\n'
|
| 159 |
-
'- **3**: Neutral/uncertain (ambiguous, could be seen as either related or unrelated)\n'
|
| 160 |
-
'- **2**: Weakly related (some minor or indirect connection, overall closer to unrelated)\n'
|
| 161 |
-
'- **1**: Completely unrelated (no clear connection)\n'
|
| 162 |
-
'## Question 2: Keyword Presence\n'
|
| 163 |
-
'Check the 10 keywords and indicate which ones are **NOT** visible in the icon image:\n'
|
| 164 |
-
'- Select **specific keywords** that are missing from the image, OR\n'
|
| 165 |
-
'- Select **"ALL WORDS PRESENT"** if all 10 keywords are visible in the image\n'
|
| 166 |
-
'You must select at least one option (either specific missing keywords or "ALL WORDS PRESENT")'
|
| 167 |
-
)
|
| 168 |
|
| 169 |
# Relevance score
|
| 170 |
label_md = gr.Markdown(visible=False)
|
|
|
|
| 151 |
|
| 152 |
# Collapsible task guide
|
| 153 |
with gr.Accordion('Task Instructions (Click to expand)', open=False):
|
| 154 |
+
gr.Markdown(q1_instruction + '\n' + q2_instruction)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 155 |
|
| 156 |
# Relevance score
|
| 157 |
label_md = gr.Markdown(visible=False)
|
src/instuction_md.py
CHANGED
|
@@ -7,7 +7,8 @@ Every time you start evaluating, input your user ID (e.g.: janeding) in the inpu
|
|
| 7 |
|
| 8 |
q1_instruction = """
|
| 9 |
## Question 1: Relevance Score (1-5)
|
| 10 |
-
Rate how relevant the icon is to the given label on a scale of 1 to 5
|
|
|
|
| 11 |
- **5**: Strongly related (highly consistent with the label, clear match)
|
| 12 |
- **4**: Moderately related (clear partial connection, overall closer to related)
|
| 13 |
- **3**: Neutral/uncertain (ambiguous, could be seen as either related or unrelated)
|
|
|
|
| 7 |
|
| 8 |
q1_instruction = """
|
| 9 |
## Question 1: Relevance Score (1-5)
|
| 10 |
+
Rate how relevant the icon is to the given label on a scale of 1 to 5.
|
| 11 |
+
### Your answer should be mainly based on your first intuition, but you may adjust it after viewing the label.
|
| 12 |
- **5**: Strongly related (highly consistent with the label, clear match)
|
| 13 |
- **4**: Moderately related (clear partial connection, overall closer to related)
|
| 14 |
- **3**: Neutral/uncertain (ambiguous, could be seen as either related or unrelated)
|