optbert

Requirements

  1. anaconda
    # Set up the proxy
    vim ~/.bashrc
    # Then append the following at the end; note the parts in {} that must be replaced:
        # 3090
        export HTTP_PROXY='http://10.10.20.100:1088'
        export HTTPS_PROXY='http://10.10.20.100:1089'
    
        # muxi
        export HTTP_PROXY='http://172.18.10.12:1089'
        export HTTPS_PROXY='http://172.18.10.12:1089'
        # replace "your name"
        torch=/home/{your name}/anaconda3/envs/torch/lib/python3.8/site-packages/torch
        export PATH=$PATH:/opt/maca/mxgpu_llvm/bin:/opt/maca/bin
        export MACA_PATH=/opt/maca
        export LD_LIBRARY_PATH=/opt/maca/lib:/opt/maca/mxgpu_llvm/lib:/opt/maca/ompi/lib:$LD_LIBRARY_PATH
        export LIBTORCH_PATH=${torch}
        export LD_LIBRARY_PATH=${torch}/lib:$LD_LIBRARY_PATH
        export CMAKE_PREFIX_PATH=${torch}/share/cmake/Torch:$CMAKE_PREFIX_PATH
        export CUCC_PATH=/opt/maca/tools/cu-bridge
        export PATH=$PATH:${CUCC_PATH}/tools:${CUCC_PATH}/bin
        export CUDA_PATH=/opt/cu-bridge/CUDA_DIR
        export PATH=$PATH:${CUDA_PATH}/bin
        export CUDA_HOME=/opt/maca/tools/cu-bridge
        export LD_LIBRARY_PATH=/usr/lib/x86_64-linux-gnu:$LD_LIBRARY_PATH
        export LD_LIBRARY_PATH=/usr/local/cuda/lib64/stubs:$LD_LIBRARY_PATH
    
        # tianshu
        export HTTP_PROXY='http://172.18.10.12:1089'
        export HTTPS_PROXY='http://172.18.10.12:1089'
        export PATH="/usr/local/corex/bin:$PATH"
        export LD_LIBRARY_PATH="/usr/local/corex/lib:$LD_LIBRARY_PATH"
        export CPLUS_INCLUDE_PATH="$CPLUS_INCLUDE_PATH:/usr/include/x86_64-linux-gnu/c++/11/"
        export CPLUS_INCLUDE_PATH="$CPLUS_INCLUDE_PATH:/usr/include/c++/11/"
        export LD_LIBRARY_PATH=/usr/lib/gcc/x86_64-linux-gnu/11/:$LD_LIBRARY_PATH
        # replace "your name"
        export PATH="/home/{your name}/anaconda3/envs/torch/bin:$PATH"
        export CXX=x86_64-conda-linux-gnu-g++
    
    # After saving and exiting
    source ~/.bashrc
    
    # Download from the Tsinghua mirror; the official source is very slow
    wget -U NoSuchBrowser/1.0 https://mirrors.tuna.tsinghua.edu.cn/anaconda/archive/Anaconda3-2023.07-2-Linux-x86_64.sh
    # Install Anaconda
    sh Anaconda3-2023.07-2-Linux-x86_64.sh
    # You need to accept the license terms
    Do you accept the license terms? [yes|no]
    [no] >>> yes
    # Answer yes here, otherwise the environment variables must be set manually
    Do you wish the installer to initialize Anaconda3 by running conda init? [yes|no]
    [no] >>> yes
    # Log in to the terminal again; the conda command is now available, so check the version
    conda -V
    
    # Edit the conda configuration file
    vim ~/.condarc
    # Paste in the contents of the block below, then clear the related caches
    channels:
        - defaults
    show_channel_urls: true
    default_channels:
        - https://mirrors.tuna.tsinghua.edu.cn/anaconda/pkgs/main
        - https://mirrors.tuna.tsinghua.edu.cn/anaconda/pkgs/r
        - https://mirrors.tuna.tsinghua.edu.cn/anaconda/pkgs/msys2
    custom_channels:
        conda-forge: https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud
        msys2: https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud
        bioconda: https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud
        menpo: https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud
        pytorch: https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud
        pytorch-lts: https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud
        simpleitk: https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud
        deepmodeling: https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud/
        nvidia: https://mirrors.sustech.edu.cn/anaconda-extra/cloud
    
    conda clean -i
    conda clean -p
    conda clean -a
    
    # Create the test environment
    conda create -n test python=3.9
    conda activate test
    
  2. cuda for 3090
    conda install -c "nvidia/label/cuda-12.1.1" cuda-toolkit
    
  3. torch
    # for 3090
    pip install torch
    
    # for muxi
    pip install /home/public/mxc500-2.19.2.23/wheel/torch-2.0.0+mc2.19.2.23-cp38-cp38-linux_x86_64.whl
    python test/patch.py
    
    # for tianshu
    pip install /share/huangshan/torch-2.1.1+corex.4.0.0-cp39-cp39-linux_x86_64.whl 
    
  4. triton for tianshu
    pip install /share/huangshan/triton-2.1.0+corex.4.0.0-cp39-cp39-linux_x86_64.whl 
    
  5. requirements
    pip install -r requirements.txt
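
Once steps 2-4 are done, a quick sanity check confirms the toolchain imports cleanly (a minimal sketch; the triton line applies to tianshu only, and on the muxi/tianshu wheels the CUDA namespace is provided by the vendor runtime):

    # torch should import and see the GPU
    python -c "import torch; print(torch.__version__, torch.cuda.is_available())"
    # tianshu only: triton should import as well
    python -c "import triton; print(triton.__version__)"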
    

Pre-installation

  1. lm_eval
    conda install git
    git clone -b v0.3.0 https://github.com/EleutherAI/lm-evaluation-harness.git
    cd lm-evaluation-harness/
    pip install -e .
    
  2. FlexGen
    cd test/baseline/FlexGen
    pip install -e .
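
Both editable installs can be verified with a one-liner (a sketch; lm_eval and flexgen are the expected top-level module names of the two packages):

    # both packages should import without error after `pip install -e .`
    python -c "import lm_eval, flexgen; print('pre-installation ok')"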
    

Installation

install sparse kernel

  1. cd into your GPU environment directory
    cd sparse-attention/{your GPU environment}/
    
  2. install the look-up-table attention package "playground"
    python setup.py install
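
To confirm the build succeeded (a sketch; "playground" is assumed to be the importable module name of the extension):

    # the look-up-table attention extension should now be importable
    python -c "import playground; print('sparse kernel ok')"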
    

install quant kernel

  1. cd into your GPU environment directory
    cd quantization/{your GPU environment}/
    
  2. install the quantization kernel "quant"
    python setup.py install
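
As with the sparse kernel, a quick import confirms the build (a sketch; "quant" is assumed to be the importable module name):

    # the quantization extension should now be importable
    python -c "import quant; print('quant kernel ok')"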
    

Test

1. Set the env variables

# if on the test machine

# nvidia or tianshu
export MODEL_OPT_PATH=/share/huangshan/opt-6.7b
export MODEL_BERT_PATH=/share/huangshan/bert-large-cased-lambada
export MODEL_LLAMA_PATH=/share/yuzhen/llama2-chinese

# muxi
export MODEL_OPT_PATH=/home/public/models/opt-6.7b
export MODEL_BERT_PATH=/home/public/models/bert-large-cased-lambada

# else
export MODEL_OPT_PATH={opt model path}
export MODEL_BERT_PATH={bert model path}
export MODEL_LLAMA_PATH={llama model path}
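
Before moving on, it is worth checking that each variable points at an existing directory (a plain-bash sketch; on muxi only the opt and bert paths apply):

# each set variable should name an existing model directory
for v in MODEL_OPT_PATH MODEL_BERT_PATH MODEL_LLAMA_PATH; do
    [ -d "${!v}" ] && echo "ok: $v=${!v}" || echo "missing: $v=${!v}"
done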

2. Generate quantized models

# for opt
## nvidia
CUDA_VISIBLE_DEVICES=0 python nvidia/opt_infer.py --model_path $MODEL_OPT_PATH --w_bit 4 --output_path quantized_model/opt

## muxi
CUDA_VISIBLE_DEVICES=0 python muxi/opt_infer.py --model_path $MODEL_OPT_PATH --w_bit 4 --w_group_size 64 --output_path quantized_model/opt --rep_file /home/public/rep_file/facebook_opt-6.7b-smooth.pt

## tianshu
CUDA_VISIBLE_DEVICES=0 python tianshu/opt_infer.py --model_path $MODEL_OPT_PATH --w_bit 4 --w_group_size 64 --output_path quantized_model/opt --rep_file /share/huangshan/rep_file/facebook_opt-6.7b-smooth.pt

# for bert
## nvidia
CUDA_VISIBLE_DEVICES=0 python nvidia/bert_infer.py --model_path $MODEL_BERT_PATH --w_bit 4 --output_path quantized_model/bert

## muxi
CUDA_VISIBLE_DEVICES=0 python muxi/bert_infer.py --model_path $MODEL_BERT_PATH --w_bit 4 --w_group_size 64 --output_path quantized_model/bert

## tianshu
CUDA_VISIBLE_DEVICES=0 python tianshu/bert_infer.py --model_path $MODEL_BERT_PATH --w_bit 4 --w_group_size 64 --output_path quantized_model/bert

# for llama
CUDA_VISIBLE_DEVICES=0 python nvidia/llama_infer.py --model_path $MODEL_LLAMA_PATH --w_bit 4 --output_path quantized_model/llama
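
If the commands above complete, the quantized checkpoints land under the given --output_path directories (a sketch; exact file names depend on the export code):

# list the generated quantized models
ls -R quantized_model/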

3. Now you can start your test using

bash {your_expected}.sh 

If you want to choose which sentences to sample:

bash {your_expected}_support_{your_env}.sh --sample {sequence numbers separated by spaces, e.g., 0 2 4 8 9}
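
For example, a hypothetical invocation (the script name here is illustrative; substitute whichever script in the repository matches your model and environment):

# e.g., test opt on an nvidia machine, sampling sentences 0, 2 and 4
bash opt_support_nvidia.sh --sample 0 2 4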
