Update app.py
Browse files
app.py
CHANGED
@@ -37,9 +37,9 @@ def load_quantized_model(model_id=None):
|
|
37 |
)
|
38 |
kwargs = {
|
39 |
'model_path': model_path,
|
40 |
-
'n_ctx':
|
41 |
-
'max_tokens':
|
42 |
-
'n_batch':
|
43 |
# 'n_gpu_layers':6,
|
44 |
}
|
45 |
return llamacpp.LlamaCpp(**kwargs)
|
|
|
37 |
)
|
38 |
kwargs = {
|
39 |
'model_path': model_path,
|
40 |
+
'n_ctx': 20000,
|
41 |
+
'max_tokens': 15000,
|
42 |
+
'n_batch': 1024,
|
43 |
# 'n_gpu_layers':6,
|
44 |
}
|
45 |
return llamacpp.LlamaCpp(**kwargs)
|