Skip to content
4 changes: 2 additions & 2 deletions week09_compression/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ conda activate inference

# To run part with auto-gptq
pip install auto-gptq==0.7.1 accelerate==0.28.0
-pip install --upgrade git+https://github.com/huggingface/transformers.git
+pip install --upgrade git+https://github.com/huggingface/transformers.git@56b64bf

# To run part with Smoothquant
cd ~
Expand Down Expand Up @@ -55,4 +55,4 @@ jupyter lab --no-browser
* https://arxiv.org/abs/2206.09557
* https://arxiv.org/abs/2208.07339
* https://huggingface.co/blog/hf-bitsandbytes-integration
-* https://pytorch.org/tutorials/advanced/static_quantization_tutorial.html
+* https://pytorch.org/tutorials/advanced/static_quantization_tutorial.html