Daemontatox committed
Commit f637502 · verified · 1 Parent(s): 547b264

Update app.py

Files changed (1): app.py (+5 -5)
app.py CHANGED

@@ -20,7 +20,7 @@ from transformers import (
 )
 
 # Configuration Constants
-MODEL_ID = "Daemontatox/Phi-4-COT"
+MODEL_ID = "Daemontatox/PathFinderAi3.0"
 
 
 # Understand]: Analyze the question to identify key details and clarify the goal.
@@ -139,9 +139,9 @@ h3 {
 def initialize_model():
     """Initialize the model with appropriate configurations"""
     quantization_config = BitsAndBytesConfig(
-        load_in_8bit=True,
-        bnb_8bit_compute_dtype=torch.bfloat16,
-        bnb_8bit_use_double_quant=True
+        load_in_4bit=True,
+        bnb_4bit_compute_dtype=torch.bfloat16,
+        bnb_4bit_use_double_quant=True
     )
 
     tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
@@ -153,7 +153,7 @@ def initialize_model():
         torch_dtype=torch.float16,
         device_map="cuda",
         attn_implementation="flash_attention_2",
-        #quantization_config=quantization_config
+        quantization_config=quantization_config
 
     )
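
For reference, here is a minimal sketch of what initialize_model() looks like after this commit. Only the lines visible in the diff are confirmed; the imports, the AutoModelForCausalLM call, and the return statement are assumptions filled in from the standard transformers API.

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig

# Confirmed by the diff: the model ID now points at PathFinderAi3.0.
MODEL_ID = "Daemontatox/PathFinderAi3.0"

def initialize_model():
    """Initialize the model with appropriate configurations"""
    # Switched from 8-bit to 4-bit loading; double quantization also
    # compresses the quantization constants, and the 4-bit matmuls
    # compute in bfloat16.
    quantization_config = BitsAndBytesConfig(
        load_in_4bit=True,
        bnb_4bit_compute_dtype=torch.bfloat16,
        bnb_4bit_use_double_quant=True,
    )

    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
    model = AutoModelForCausalLM.from_pretrained(  # assumed call; the diff shows only its kwargs
        MODEL_ID,
        torch_dtype=torch.float16,        # dtype for the modules left unquantized
        device_map="cuda",
        attn_implementation="flash_attention_2",
        quantization_config=quantization_config,  # re-enabled by this commit
    )
    return model, tokenizer  # assumed; the diff does not show the return

One detail worth noting: bnb_4bit_compute_dtype is bfloat16 while torch_dtype stays float16. With quantization enabled, torch_dtype only governs the non-quantized modules, so the mismatch should be harmless, though aligning both on bfloat16 would be the more conventional choice.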