Update README.md
Browse files
README.md
CHANGED
|
@@ -1,5 +1,10 @@
|
|
| 1 |
---
|
| 2 |
license: apache-2.0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3 |
---
|
| 4 |
|
| 5 |
# InfiGUIAgent-2B-Stage1
|
|
@@ -35,7 +40,7 @@ processor = AutoProcessor.from_pretrained("Reallm-Labs/InfiGUIAgent-2B-Stage1")
|
|
| 35 |
|
| 36 |
# Prepare inputs
|
| 37 |
img_url = "https://raw.githubusercontent.com/Reallm-Labs/InfiGUIAgent/main/images/test_img.png"
|
| 38 |
-
prompt_template = """Output the relative coordinates of the icon, widget, or text most closely related to "{instruction}" in this screenshot, in the format of "{"x": x, "y": y}", where x and y are in the positive directions of horizontal left and vertical down respectively, with the origin at the top left corner, and the range is 0-1000."""
|
| 39 |
|
| 40 |
# Download image
|
| 41 |
response = requests.get(img_url)
|
|
|
|
| 1 |
---
|
| 2 |
license: apache-2.0
|
| 3 |
+
language:
|
| 4 |
+
- en
|
| 5 |
+
base_model:
|
| 6 |
+
- Qwen/Qwen2-VL-2B-Instruct
|
| 7 |
+
pipeline_tag: image-text-to-text
|
| 8 |
---
|
| 9 |
|
| 10 |
# InfiGUIAgent-2B-Stage1
|
|
|
|
| 40 |
|
| 41 |
# Prepare inputs
|
| 42 |
img_url = "https://raw.githubusercontent.com/Reallm-Labs/InfiGUIAgent/main/images/test_img.png"
|
| 43 |
+
prompt_template = """Output the relative coordinates of the icon, widget, or text most closely related to "{instruction}" in this screenshot, in the format of \"{{\"x\": x, \"y\": y}}\", where x and y are in the positive directions of horizontal left and vertical down respectively, with the origin at the top left corner, and the range is 0-1000."""
|
| 44 |
|
| 45 |
# Download image
|
| 46 |
response = requests.get(img_url)
|