增加Tars
This commit is contained in:
BIN
TARS/UI-TARS/data/coordinate_process_image.png
Normal file
BIN
TARS/UI-TARS/data/coordinate_process_image.png
Normal file
Binary file not shown.
|
After Width: | Height: | Size: 983 KiB |
BIN
TARS/UI-TARS/data/coordinate_process_image_som.png
Normal file
BIN
TARS/UI-TARS/data/coordinate_process_image_som.png
Normal file
Binary file not shown.
|
After Width: | Height: | Size: 983 KiB |
89
TARS/UI-TARS/data/test_messages.json
Normal file
89
TARS/UI-TARS/data/test_messages.json
Normal file
File diff suppressed because one or more lines are too long
17
TARS/UI-TARS/data/test_messages_single_image.json
Normal file
17
TARS/UI-TARS/data/test_messages_single_image.json
Normal file
File diff suppressed because one or more lines are too long
72
TARS/UI-TARS/data/training_example.json
Normal file
72
TARS/UI-TARS/data/training_example.json
Normal file
@@ -0,0 +1,72 @@
|
||||
[
|
||||
{
|
||||
"role": "system",
|
||||
"content": "You are a helpful assistant.",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "user",
|
||||
"content": "You are a GUI agent. You are given a task and your action history, with screenshots. You need to perform the next action to complete the task. \n\n## Output Format\n\nAction: ...\n\n\n## Action Space\nclick(start_box='<|box_start|>(x1,y1)<|box_end|>')\nselect(start_box='<|box_start|>(x1,y1)<|box_end|>') # To expand a dropdown menu or select an item from it.\ntype(content='', start_box='<|box_start|>(x1,y1)<|box_end|>') # First click on the textbox, and then type the content.\n\n## User Instruction\nBuy a pop rock album CD from the United Kingdom that was released in 2016, is between £15 and £20 and in perfect condition.\n\n ",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "assistant",
|
||||
"content": "Action: click(start_box='<|box_start|>(495,30)<|box_end|>')",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "assistant",
|
||||
"content": "Action: click(start_box='<|box_start|>(381,153)<|box_end|>')",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "assistant",
|
||||
"content": "Action: click(start_box='<|box_start|>(66,263)<|box_end|>')",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "assistant",
|
||||
"content": "Action: click(start_box='<|box_start|>(66,851)<|box_end|>')",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "user",
|
||||
"content": "<|vision_start|><|image_pad|>...<|image_pad|><|vision_end|>",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "assistant",
|
||||
"content": "Action: click(start_box='<|box_start|>(66,638)<|box_end|>')",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "user",
|
||||
"content": "<|vision_start|><|image_pad|>...<|image_pad|><|vision_end|>",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "assistant",
|
||||
"content": "Action: click(start_box='<|box_start|>(66,86)<|box_end|>')",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "user",
|
||||
"content": "<|vision_start|><|image_pad|>...<|image_pad|><|vision_end|>",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "assistant",
|
||||
"content": "Action: click(start_box='<|box_start|>(66,5)<|box_end|>')",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "user",
|
||||
"content": "<|vision_start|><|image_pad|>...<|image_pad|><|vision_end|>",
|
||||
"loss_mask": 0
|
||||
},
|
||||
{
|
||||
"role": "assistant",
|
||||
"content": "Action: click(start_box='<|box_start|>(293,218)<|box_end|>')",
|
||||
"loss_mask": 1
|
||||
}
|
||||
]
|
||||
Reference in New Issue
Block a user