hailey2024 committed on
Commit
12d4c5a
·
1 Parent(s): 097d2a9

update instruction

Browse files
Files changed (3) hide show
  1. eval_round_r1.db +3 -0
  2. src/eval_server.py +1 -14
  3. src/instuction_md.py +2 -1
eval_round_r1.db ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1a533d4d5865529ddc5a733df7afb48b05c4704ead3df9f35cf1169e3807610
3
+ size 65536
src/eval_server.py CHANGED
@@ -151,20 +151,7 @@ def app_main(args) -> None:
151
 
152
  # Collapsible task guide
153
  with gr.Accordion('Task Instructions (Click to expand)', open=False):
154
- gr.Markdown(
155
- '## Question 1: Relevance Score (1-5)\n'
156
- 'Rate how relevant the icon is to the given label on a scale of 1 to 5:\n'
157
- '- **5**: Strongly related (highly consistent with the label, clear match)\n'
158
- '- **4**: Moderately related (clear partial connection, overall closer to related)\n'
159
- '- **3**: Neutral/uncertain (ambiguous, could be seen as either related or unrelated)\n'
160
- '- **2**: Weakly related (some minor or indirect connection, overall closer to unrelated)\n'
161
- '- **1**: Completely unrelated (no clear connection)\n'
162
- '## Question 2: Keyword Presence\n'
163
- 'Check the 10 keywords and indicate which ones are **NOT** visible in the icon image:\n'
164
- '- Select **specific keywords** that are missing from the image, OR\n'
165
- '- Select **"ALL WORDS PRESENT"** if all 10 keywords are visible in the image\n'
166
- 'You must select at least one option (either specific missing keywords or "ALL WORDS PRESENT")'
167
- )
168
 
169
  # Relevance score
170
  label_md = gr.Markdown(visible=False)
 
151
 
152
  # Collapsible task guide
153
  with gr.Accordion('Task Instructions (Click to expand)', open=False):
154
+ gr.Markdown(q1_instruction + '\n' + q2_instruction)
 
 
 
 
 
 
 
 
 
 
 
 
 
155
 
156
  # Relevance score
157
  label_md = gr.Markdown(visible=False)
src/instuction_md.py CHANGED
@@ -7,7 +7,8 @@ Every time you start evaluating, input your user ID (e.g.: janeding) in the inpu
7
 
8
  q1_instruction = """
9
  ## Question 1: Relevance Score (1-5)
10
- Rate how relevant the icon is to the given label on a scale of 1 to 5:
 
11
  - **5**: Strongly related (highly consistent with the label, clear match)
12
  - **4**: Moderately related (clear partial connection, overall closer to related)
13
  - **3**: Neutral/uncertain (ambiguous, could be seen as either related or unrelated)
 
7
 
8
  q1_instruction = """
9
  ## Question 1: Relevance Score (1-5)
10
+ Rate how relevant the icon is to the given label on a scale of 1 to 5.
11
+ ### Your answer should be mainly based on your first intuition, but you may adjust it after viewing the label.
12
  - **5**: Strongly related (highly consistent with the label, clear match)
13
  - **4**: Moderately related (clear partial connection, overall closer to related)
14
  - **3**: Neutral/uncertain (ambiguous, could be seen as either related or unrelated)