From 7e0b75bbb856ddf062a0ee0ca491b6459726aeea Mon Sep 17 00:00:00 2001 From: lvhan028 Date: Fri, 28 Jul 2023 15:10:20 +0800 Subject: [PATCH] bump version to v0.0.2 (#177) * bump version to v0.0.2 * fix command * update installation and inference section --- README.md | 9 +++------ README_zh-CN.md | 7 ++----- lmdeploy/version.py | 2 +- 3 files changed, 6 insertions(+), 12 deletions(-) diff --git a/README.md b/README.md index 43e618af49..9b8a7c6962 100644 --- a/README.md +++ b/README.md @@ -55,9 +55,7 @@ Below are quick steps for installation: ```shell conda create -n lmdeploy python=3.10 -y conda activate lmdeploy -git clone https://github.com/InternLM/lmdeploy.git -cd lmdeploy -pip install -e . +pip install lmdeploy ``` ### Deploy InternLM @@ -83,8 +81,7 @@ python3 -m lmdeploy.serve.turbomind.deploy internlm-chat-7b /path/to/internlm-ch #### Inference by TurboMind ```shell -docker run --gpus all --rm -v $(pwd)/workspace:/workspace -it openmmlab/lmdeploy:latest \ - python3 -m lmdeploy.turbomind.chat /workspace +python3 -m lmdeploy.turbomind.chat ./workspace ``` ```{note} @@ -109,7 +106,7 @@ python3 -m lmdeploy.serve.client {server_ip_addresss}:33337 or webui, ```shell -python3 -m lmdeploy.app {server_ip_addresss}:33337 internlm +python3 -m lmdeploy.app {server_ip_addresss}:33337 ``` ![](https://github.com/InternLM/lmdeploy/assets/67539920/08d1e6f2-3767-44d5-8654-c85767cec2ab) diff --git a/README_zh-CN.md b/README_zh-CN.md index 3e8f27036e..620186acb3 100644 --- a/README_zh-CN.md +++ b/README_zh-CN.md @@ -54,9 +54,7 @@ TurboMind 的 output token throughput 超过 2000 token/s, 整体比 DeepSpeed ```shell conda create -n lmdeploy python=3.10 -y conda activate lmdeploy -git clone https://github.com/InternLM/lmdeploy.git -cd lmdeploy -pip install -e . 
+pip install lmdeploy ``` ### 部署 InternLM @@ -82,8 +80,7 @@ python3 -m lmdeploy.serve.turbomind.deploy internlm-chat-7b /path/to/internlm-ch #### 使用 turbomind 推理 ```shell -docker run --gpus all --rm -v $(pwd)/workspace:/workspace -it openmmlab/lmdeploy:latest \ - python3 -m lmdeploy.turbomind.chat /workspace +python3 -m lmdeploy.turbomind.chat ./workspace ``` ```{note} diff --git a/lmdeploy/version.py b/lmdeploy/version.py index 079f9e66d8..8960a13972 100644 --- a/lmdeploy/version.py +++ b/lmdeploy/version.py @@ -1,7 +1,7 @@ # Copyright (c) OpenMMLab. All rights reserved. from typing import Tuple -__version__ = '0.0.1' +__version__ = '0.0.2' short_version = __version__