JRosenkranz committed on
Commit
793388b
1 Parent(s): 0c7b651

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -3
README.md CHANGED
@@ -40,7 +40,7 @@ _Note: For all samples, your environment must have access to cuda_
40
  #### Setup
41
 
42
  ```bash
43
- docker pull quay.io/wxpe/text-gen-server:speculative-decoding.ecd73c4
44
  docker run -d --rm --gpus all \
45
  --name my-tgis-server \
46
  -p 8033:8033 \
@@ -50,7 +50,7 @@ docker run -d --rm --gpus all \
50
  -e FLASH_ATTENTION=true \
51
  -e PAGED_ATTENTION=true \
52
  -e DTYPE_STR=float16 \
53
- quay.io/wxpe/text-gen-server:speculative-decoding.ecd73c4
54
 
55
  # check logs and wait for "gRPC server started on port 8033" and "HTTP server started on port 3000"
56
  docker logs my-tgis-server -f
@@ -58,7 +58,7 @@ docker logs my-tgis-server -f
58
  # get the client sample (Note: The first prompt will take longer as there is a warmup time)
59
  conda create -n tgis-client-env python=3.11
60
  conda activate tgis-client-env
61
- git clone --branch speculative-decoding --single-branch https://github.com/tdoublep/text-generation-inference.git
62
  cd text-generation-inference/integration_tests
63
  make gen-client
64
  pip install . --no-cache-dir
 
40
  #### Setup
41
 
42
  ```bash
43
+ docker pull quay.io/wxpe/text-gen-server:main.ee927a4
44
  docker run -d --rm --gpus all \
45
  --name my-tgis-server \
46
  -p 8033:8033 \
 
50
  -e FLASH_ATTENTION=true \
51
  -e PAGED_ATTENTION=true \
52
  -e DTYPE_STR=float16 \
53
+ quay.io/wxpe/text-gen-server:main.ee927a4
54
 
55
  # check logs and wait for "gRPC server started on port 8033" and "HTTP server started on port 3000"
56
  docker logs my-tgis-server -f
 
58
  # get the client sample (Note: The first prompt will take longer as there is a warmup time)
59
  conda create -n tgis-client-env python=3.11
60
  conda activate tgis-client-env
61
+ git clone --branch main --single-branch https://github.com/IBM/text-generation-inference.git
62
  cd text-generation-inference/integration_tests
63
  make gen-client
64
  pip install . --no-cache-dir