Update inference code
README.md CHANGED

```diff
@@ -99,6 +99,8 @@ import torch
 from transformers import Qwen2_5_VLForConditionalGeneration, AutoTokenizer, AutoProcessor
 from PIL import Image
 import groundcua
+import io
+from urllib.request import urlopen
 
 model_name = "ServiceNow/GroundNext-7B-V0"
 
@@ -120,12 +122,12 @@ model.generation_config.do_sample = False
 model.generation_config.use_cache = True
 
 # Load and prepare image
-url = "https://huggingface.co/datasets/ServiceNow/GroundCUA/resolve/main/images/
+url = "https://huggingface.co/datasets/ServiceNow/GroundCUA/resolve/main/images/7-Zip/001f0079a489909eb94e47c2374b7bf36ab1842e314592ce30a34d18a54eb1df.png"
 image = Image.open(io.BytesIO(urlopen(url).read()))
 image, (width, height) = groundcua.prepare_image(image)
 
 # Create messages and generate
-instruction = "Click on the '
+instruction = "Click on the 'File' button"
 messages = groundcua.create_messages(instruction, image, width, height)
 
 input_text = tokenizer.apply_chat_template(messages, add_generation_prompt=True, tokenize=False)
```
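For reference, here is how the updated snippet fits together end to end after this commit. The model/tokenizer/processor loading (README lines 107–119) and the final decoding step fall outside the diff hunks, so those parts are a minimal sketch assuming standard transformers usage (`from_pretrained` with `device_map="auto"`, a processor-based generate/decode loop), not necessarily the README's exact code; the `groundcua` helpers are used exactly as shown in the diff.

```python
import io
from urllib.request import urlopen

import torch
from PIL import Image
from transformers import Qwen2_5_VLForConditionalGeneration, AutoProcessor, AutoTokenizer

import groundcua  # repo helper module; prepare_image/create_messages as used in the diff

model_name = "ServiceNow/GroundNext-7B-V0"

# Loading is elided in the diff context; this is one standard way to load a
# Qwen2.5-VL checkpoint with transformers (an assumption, not the README's exact lines).
model = Qwen2_5_VLForConditionalGeneration.from_pretrained(
    model_name, torch_dtype=torch.bfloat16, device_map="auto"
)
tokenizer = AutoTokenizer.from_pretrained(model_name)
processor = AutoProcessor.from_pretrained(model_name)
model.generation_config.do_sample = False  # greedy decoding, per the diff context
model.generation_config.use_cache = True

# Load and prepare image (lines added by this commit)
url = "https://huggingface.co/datasets/ServiceNow/GroundCUA/resolve/main/images/7-Zip/001f0079a489909eb94e47c2374b7bf36ab1842e314592ce30a34d18a54eb1df.png"
image = Image.open(io.BytesIO(urlopen(url).read()))
image, (width, height) = groundcua.prepare_image(image)

# Create messages and generate (instruction line added by this commit)
instruction = "Click on the 'File' button"
messages = groundcua.create_messages(instruction, image, width, height)
input_text = tokenizer.apply_chat_template(messages, add_generation_prompt=True, tokenize=False)

# The generation step is outside the diff hunks; an assumed decoding path:
inputs = processor(text=[input_text], images=[image], return_tensors="pt").to(model.device)
output_ids = model.generate(**inputs, max_new_tokens=128)
print(processor.batch_decode(output_ids[:, inputs.input_ids.shape[1]:], skip_special_tokens=True)[0])
```

Note that the two imports added by this commit (`io`, `urllib.request.urlopen`) are exactly what the pre-existing `Image.open(io.BytesIO(urlopen(url).read()))` line requires, so the old snippet would have raised a `NameError` as published.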