RPW committed on
Commit
e7993e4
·
verified ·
1 Parent(s): 37c32fd

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +17 -6
app.py CHANGED
# app.py — streamed image-description inference for a Llama-3.2-Vision checkpoint.
#
# NOTE(review): recovered from a diff view. The committed code had several hard
# defects, fixed below:
#   * `TextStreamer` was used but never imported (NameError at runtime).
#   * `image` was referenced but never defined (NameError at runtime).
#   * A sequence-classification class (`RobertaForSequenceClassification`, then
#     `AutoModelForSequenceClassification`) was loaded for a *generative vision*
#     checkpoint and asked to `.generate()` — a vision-instruct model needs a
#     processor (image preprocessor + tokenizer) and a conditional-generation
#     model class; a plain text tokenizer cannot consume an image.
#   * The old revision hard-coded `.to("cuda")` despite computing `device`.
#   * `temperature`/`min_p` were passed without `do_sample=True`, so
#     `generate()` would ignore them.

from transformers import AutoProcessor, MllamaForConditionalGeneration, TextStreamer
import torch

# Model checkpoint and execution device (CPU fallback when no GPU is present).
MODEL_NAME = "RPW/NIH-1.2_Llama-3.2-11B-Vision-Instruct"
device = "cuda" if torch.cuda.is_available() else "cpu"

instruction = "You are an expert radiographer. Describe accurately what you see in this image."

# The processor bundles the image preprocessor and the tokenizer for
# vision-language checkpoints.
processor = AutoProcessor.from_pretrained(MODEL_NAME)
# torch_dtype="auto" keeps the checkpoint's native precision — an 11B model
# materialized in fp32 would not fit on most single GPUs.
model = MllamaForConditionalGeneration.from_pretrained(
    MODEL_NAME, torch_dtype="auto"
).to(device)

# FIXME(review): `image` was undefined in the original script. Load a
# PIL.Image (e.g. `Image.open(path)`) here before running.
image = ...

# Llama-3.2-Vision chat format: the user turn carries an image placeholder
# followed by the text prompt.
messages = [
    {
        "role": "user",
        "content": [
            {"type": "image"},
            {"type": "text", "text": instruction},
        ],
    }
]

input_text = processor.apply_chat_template(messages, add_generation_prompt=True)
inputs = processor(
    image,
    input_text,
    add_special_tokens=False,
    return_tensors="pt",
).to(device)

# Stream decoded tokens to stdout as they are produced.
text_streamer = TextStreamer(processor.tokenizer, skip_prompt=True)
_ = model.generate(
    **inputs,
    streamer=text_streamer,
    max_new_tokens=128,
    use_cache=True,
    do_sample=True,  # required for temperature/min_p to take effect
    temperature=1.5,
    min_p=0.1,
)