From 5deffc02ba85eb1b15965d34c071ddf988b73241 Mon Sep 17 00:00:00 2001 From: "cuiqing.li" Date: Mon, 30 Oct 2023 14:33:59 +0800 Subject: [PATCH 1/2] update doc --- colossalai/inference/README.md | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/colossalai/inference/README.md b/colossalai/inference/README.md index 4aca7aeb0582..1d663a42be59 100644 --- a/colossalai/inference/README.md +++ b/colossalai/inference/README.md @@ -59,16 +59,14 @@ dependencies pytorch= 1.13.1 (gpu) cuda>= 11.6 transformers= 4.30.2 -triton==2.0.0.dev20221202 -# for install vllm, please use this branch to install https://github.com/tiandiao123/vllm/tree/setup_branch -vllm +triton # for install flash-attention, please use commit hash: 67ae6fd74b4bc99c36b2ce524cf139c35663793c flash-attention # install lightllm since we depend on lightllm triton kernels git clone https://github.com/ModelTC/lightllm -git checkout 28c1267cfca536b7b4f28e921e03de735b003039 cd lightllm +git checkout 28c1267cfca536b7b4f28e921e03de735b003039 pip3 install -e . # also, install xformers from source: @@ -93,8 +91,8 @@ pip install -e . # install lightllm git clone https://github.com/ModelTC/lightllm -git checkout 28c1267cfca536b7b4f28e921e03de735b003039 cd lightllm +git checkout 28c1267cfca536b7b4f28e921e03de735b003039 pip3 install -e . # install xformers from source From e139f8eeb843a1e875ed0e95d27f6029ff998e84 Mon Sep 17 00:00:00 2001 From: Cuiqing Li Date: Mon, 30 Oct 2023 17:00:39 +0800 Subject: [PATCH 2/2] Update README.md --- colossalai/inference/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/colossalai/inference/README.md b/colossalai/inference/README.md index 1d663a42be59..cf5dbf245205 100644 --- a/colossalai/inference/README.md +++ b/colossalai/inference/README.md @@ -60,7 +60,7 @@ pytorch= 1.13.1 (gpu) cuda>= 11.6 transformers= 4.30.2 triton -# for install flash-attention, please use commit hash: 67ae6fd74b4bc99c36b2ce524cf139c35663793c +# for install flash-attention flash-attention # install lightllm since we depend on lightllm triton kernels