mirror of
https://github.com/OneUptime/oneuptime.git
synced 2026-04-06 00:32:12 +02:00
enable gpu on llama docker
This commit is contained in:
@@ -13,6 +13,14 @@ docker build -t llama . -f ./Llama/Dockerfile
|
||||
|
||||
## Run
|
||||
|
||||
### For Linux (with GPU)
|
||||
|
||||
```
|
||||
docker run --gpus all -p 8547:8547 -it -v ./Llama/Models:/app/Models llama
|
||||
```
|
||||
|
||||
### For macOS (CPU only)
|
||||
|
||||
```
|
||||
docker run -p 8547:8547 -it -v ./Llama/Models:/app/Models llama
|
||||
```
|
||||
|
||||
@@ -15,7 +15,8 @@ tokenizer = AutoTokenizer.from_pretrained(model_path, local_files_only=True)
|
||||
pipeline = transformers.pipeline(
|
||||
"text-generation",
|
||||
model=model_path,
|
||||
torch_dtype=torch.float32,
|
||||
# torch_dtype=torch.float32, # for CPU
|
||||
torch_dtype=torch.float16, # for GPU
|
||||
device_map="auto",
|
||||
)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user