petals inference

pull/572/head
John Doe 1 month ago
parent 5b7e7c7375
commit c6dd015ea3

@@ -2,8 +2,8 @@
Description=Petals Inference
[Service]
# Settings for the process that runs the Petals inference server.
# NOTE(review): the two commented-out lines below duplicate the active
# User=/Group= settings that follow; they look like the pre-change side of
# this diff — confirm before keeping both.
#User=petals
#Group=petals
# Run the service process as the "petals" user and group.
User=petals
Group=petals
# Set PJRT_DEVICE=TPU in the service's environment.
# NOTE(review): presumably read by the XLA/PJRT runtime to select the TPU
# backend — confirm.
Environment=PJRT_DEVICE=TPU
# Launch the petals.cli.run_server module with the Python interpreter at
# /home/petals/venv/bin/python, passing port 31330, the
# petals-team/StableBeluga2 model name, the xla device, and --num_blocks=4.
ExecStart=/home/petals/venv/bin/python -m petals.cli.run_server --port 31330 petals-team/StableBeluga2 --device xla --num_blocks=4

Loading…
Cancel
Save