Spaces:
Running
Running
Update rag_engine.py
Browse files
- rag_engine.py +1 -1
rag_engine.py
CHANGED
|
@@ -54,7 +54,7 @@ def cached_load_model():
|
|
| 54 |
tokenizer = AutoTokenizer.from_pretrained(embedding_model)
|
| 55 |
model = AutoModel.from_pretrained(
|
| 56 |
embedding_model,
|
| 57 |
-
torch_dtype=torch.
|
| 58 |
)
|
| 59 |
|
| 60 |
# Move model to CPU and set to eval mode for inference
|
|
|
|
| 54 |
tokenizer = AutoTokenizer.from_pretrained(embedding_model)
|
| 55 |
model = AutoModel.from_pretrained(
|
| 56 |
embedding_model,
|
| 57 |
+
torch_dtype=torch.bfloat16
|
| 58 |
)
|
| 59 |
|
| 60 |
# Move model to CPU and set to eval mode for inference
|