Update app.py
Browse files
app.py
CHANGED
|
@@ -134,6 +134,7 @@ tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
|
| 134 |   model = AutoModelForCausalLM.from_pretrained(
| 135 |       MODEL_ID,
| 136 |       device_map="auto",
| 137 |       quantization_config=quantization_config,
| 138 |       attn_implementation="flash_attention_2",
| 139 |   )
|
|
|
|
| 134 |   model = AutoModelForCausalLM.from_pretrained(
| 135 |       MODEL_ID,
| 136 |       device_map="auto",
| 137 | +     low_cpu_mem_usage=True,
| 138 |       quantization_config=quantization_config,
| 139 |       attn_implementation="flash_attention_2",
| 140 |   )
|