added setup.sh and added .env.example

4 weeks ago · 5744205357
parent a13e0986f5
commit 5744205357
5 changed files with 25 additions and 127 deletions
--- a/.env.example
+++ b/.env.example
@ -0,0 +1,6 @
+# Bootstrap peer multiaddr(s) handed to --initial_peers; setup.sh fills this in.
+INITIAL_PEERS=
+# Device handed to run_server --device; use a lowercase name such as cuda or cpu.
+DEVICE=cuda
+# Model id given to petals.cli.run_server as its positional argument.
+MODEL=meta-llama/Meta-Llama-3-8B-Instruct
--- a/docker-compose.yml
+++ b/docker-compose.yml
@ -1,53 +1,19 @@
 services:
  backbone:
    profiles: ["core"]
    image: h4ckermike/petals:main
    command: python -m petals.cli.run_dht --host_maddrs /ip4/0.0.0.0/tcp/8008 --identity_path /cache/bootstrap1.id
    volumes:
      - petals-cache-backbone:/cache
    network_mode: host
    ipc: host
    restart: unless-stopped
-    
-  health:
-    profiles: ["core"]
-    restart: always
-    depends_on:
-     - backbone
-    image: h4ckermike/health.petals:main
-    ports:
-      - "8009:5000"
-    command: flask run --host=0.0.0.0 --port=5000

-  tinyllama_local_gpu:
-    profiles: ["local","gpu"]
-   #    image: h4ckermike/petals:main
-    build : .
-    depends_on:
-       - backbone
-    ports:
-      - "31336:31336"
-    command: python -m petals.cli.run_server --port 31336  --num_blocks=1 Maykeye/TinyLLama-v0 --initial_peers $INITIAL_PEERS  --device=$DEVICE
-    deploy:
-      resources:
-        reservations:
-          devices:
-            - driver: nvidia
-              count: 1
-              capabilities: [gpu]
-    restart: always
-
-#
  envmodel_local_gpu:
    profiles: ["local","gpu"]
    build: .
    environment:
      - MODEL=${MODEL}
-    depends_on:
-       - backbone
-       # xai-org/grok-1
-       # hpcai-tech/grok-1
-       # keyfan/grok-1-hf
    command: python -m petals.cli.run_server --port 31331  --num_blocks=1  $MODEL  --initial_peers $INITIAL_PEERS  --device=$DEVICE
    ports:
      - "31331:31331"
@ -60,95 +26,5 @@ services:
              count: 1
              capabilities: [gpu]

-  tinymixtral_local_gpu:
-    profiles: ["local","gpu"]
-    build: .
-    depends_on:
-       - backbone
-    command: python -m petals.cli.run_server --port 31331  --num_blocks=1 SanjiWatsuki/TinyMixtral-32x248M  --initial_peers $INITIAL_PEERS  --device=$DEVICE
-    ports:
-      - "31331:31331"
-    restart: always
-
-    deploy:
-      resources:
-        reservations:
-          devices:
-            - driver: nvidia
-              count: 1
-              capabilities: [gpu]
-
-  tinyllama_local_cpu:
-    profiles: ["local","cpu"]
-    build: .
-    depends_on:
-       - backbone
-    command: python -m petals.cli.run_server --port 31331  --num_blocks=1 Maykeye/TinyLLama-v0 --initial_peers $INITIAL_PEERS  --device=$DEVICE
-    ports:
-      - "31331:31331"
-    restart: always
-
-    
-  tinyllamacpu:
-    profiles: ["tinyllama","cpu"]
-    image: h4ckermike/petals:main
-    depends_on:
-       - backbone
-    command: python -m petals.cli.run_server --port 31331  --num_blocks=1 Maykeye/TinyLLama-v0 --initial_peers $INITIAL_PEERS  --device=$DEVICE
-    ports:
-      - "31331:31331"
-    restart: always
-
-    
-  tinyllamagpu:
-    profiles: ["core"]
-    image: h4ckermike/petals:main
-    depends_on:
-       - backbone
-    ports:
-      - "31332:31332"
-    command: python -m petals.cli.run_server --port 31332  --num_blocks=100 Maykeye/TinyLLama-v0 --initial_peers $INITIAL_PEERS  --device=$DEVICE
-    deploy:
-      resources:
-        reservations:
-          devices:
-            - driver: nvidia
-              count: 1
-              capabilities: [gpu]
-    restart: always
-
-    
-  tinyllamatpu:
-    profiles: ["tpu"]
-    image: h4ckermike/petals:main
-    depends_on:
-       - backbone
-    ports:
-      - "31333:31333"
-    command: python -m petals.cli.run_server --port 31333  --num_blocks=1 Maykeye/TinyLLama-v0 --initial_peers $INITIAL_PEERS  --device=$DEVICE
-    restart: always
-
-
-  debug_health:
-    profiles: ["debug"]
-
-    image: h4ckermike/health.petals:main
-    command: bash
-    stdin_open: true
-    tty: true
-
-  inference   :
-    profiles: ["core"]
-    restart: always
-    depends_on:
-      - backbone
-    image: h4ckermike/inference.petals:main
-#    image: petals-inference-test
-    ports:
-      - "8010:5000"
-
-    command: gunicorn app:app --bind 0.0.0.0:5000 --worker-class gthread --threads 100 --timeout 1000
-
-
 volumes:
  petals-cache-backbone:
--- a/envs/gpu/h100/peers.txt
+++ b/envs/gpu/h100/peers.txt
@ -1 +1 @@
-/ip4/216.81.245.26/tcp/8099/p2p/QmR4PcZvHg414Q2HNEaQZLiu69HD4Vs17hcwDgq8qJdJq2
+INITIAL_PEERS=/dns/dht1.cillium.dev.compute.agentartificial.com/tcp/8008/p2p/Qmb3skfrki1PR8ww6nxvoGm51F5imK3e1DPMZgtay6ofE2
--- a/get_peersl.sh
+++ b/get_peersl.sh
@ -1 +1 @@
-docker logs petals-backbone-1 2>&1  |grep initial_peers |cut "-d " -f18-  | sort -u > peers.txt
+docker logs petals-backbone-1 2>&1  | grep initial_peers | cut "-d " -f18-  | sort -u > peers.txt
--- a/setup.sh
+++ b/setup.sh
@ -0,0 +1,19 @@
+#!/bin/bash
+# Bootstrap: write .env from .env.example, build a venv, install, start the "core" profile.
+set -e
+# Fall back to the checked-in peers file when INITIAL_PEERS is unset or empty.
+if [ -z "$INITIAL_PEERS" ]; then
+    # Use the first line only and drop a leading "INITIAL_PEERS=" key if the file has one.
+    INITIAL_PEERS=$(sed -n '1{s/^INITIAL_PEERS=//;p;}' envs/gpu/h100/peers.txt)
+fi
+
+cp .env.example .env
+# Multiaddrs contain '/', so '|' is used as the sed delimiter.
+sed -i "s|^INITIAL_PEERS=.*|INITIAL_PEERS=$INITIAL_PEERS|" .env
+
+python -m venv .venv
+source .venv/bin/activate
+python -m pip install --upgrade pip
+pip install setuptools wheel gnureadline
+pip install -e .
+docker compose --profile core --env-file .env up -d