Spaces:

RPW
/

NIH1.2_Llama3.2

Runtime error

RPW committed on Dec 16, 2024

Commit

37c32fd

verified ·

1 Parent(s): 6de0aed

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,17 +4,19 @@ import torch
 MODEL_NAME = "RPW/NIH-1.2_Llama-3.2-11B-Vision-Instruct"
 device = "cuda" if torch.cuda.is_available() else "cpu"
 # Load the tokenizer and model
 tokenizer = RobertaTokenizer.from_pretrained(MODEL_NAME)
 model = RobertaForSequenceClassification.from_pretrained(MODEL_NAME).to(device)
-# Example usage: Tokenizing some input text
-input_text = "Describe this image."
-inputs = tokenizer(input_text, return_tensors="pt").to(device)
-# Generating output
-outputs = model(**inputs)
-logits = outputs.logits
-# ใช้ softmax หรือการแปลงค่าอื่นๆ ถ้าต้องการผลลัพธ์ที่เหมาะสมกับการ classification
-print(logits)

 MODEL_NAME = "RPW/NIH-1.2_Llama-3.2-11B-Vision-Instruct"
 device = "cuda" if torch.cuda.is_available() else "cpu"
+instruction = "You are an expert radiographer. Describe accurately what you see in this image."
 # Load the tokenizer and model
 tokenizer = RobertaTokenizer.from_pretrained(MODEL_NAME)
 model = RobertaForSequenceClassification.from_pretrained(MODEL_NAME).to(device)
+input_text = tokenizer.apply_chat_template(messages, add_generation_prompt=True)
+inputs = tokenizer(
+    image,
+    input_text,
+    add_special_tokens=False,
+    return_tensors="pt").to("cuda")
+text_streamer = TextStreamer(tokenizer, skip_prompt=True)
+_ = model.generate(**inputs, streamer=text_streamer, max_new_tokens=128,
+                   use_cache=True, temperature=1.5, min_p=0.1)