# Model settings
# Device string handed to the consuming application (presumably a PyTorch-style
# device name -- confirm against the loader).
device = "cuda"
# Model identifier (looks like a Hugging Face Hub repo id -- verify with the loader).
model_name = "google/paligemma2-3b-ft-docci-448"

# Decoding settings
# TOML booleans must be lowercase; `True` is rejected by TOML parsers.
sampling = true