mirror of
https://github.com/kou029w/_.git
synced 2025-01-30 22:08:02 +00:00
add bitnet
This commit is contained in:
parent
3ef34e52e2
commit
876d84fb75
1 changed files with 14 additions and 0 deletions
14
bitnet/Dockerfile
Normal file
14
bitnet/Dockerfile
Normal file
|
@@ -0,0 +1,14 @@
|
||||||
|
# Base image: the python:3.9-alpine tag (Python 3.9 on Alpine Linux).
FROM python:3.9-alpine
|
||||||
|
# Install the C/C++ build toolchain (build-base, clang, cmake) and git.
# `--no-cache` makes apk fetch the package index on the fly without storing it,
# so no manual cleanup of /var/cache/apk is needed afterwards.
RUN apk add --no-cache \
        build-base \
        clang \
        cmake \
        git
|
||||||
|
# Shallow-clone (depth 1) the BitNet repository together with its submodules,
# then delete the top-level .git directory in the same layer
# (presumably to keep repository metadata out of the image).
RUN git clone \
        --depth 1 \
        --recursive \
        https://github.com/microsoft/BitNet.git \
    && rm -rf BitNet/.git
|
||||||
|
# Run every following instruction (and the container's default command) from /BitNet,
# presumably the checkout created by the preceding git clone.
WORKDIR /BitNet
|
||||||
|
# Install the Python dependencies listed in the repository's requirements.txt.
# `--no-cache-dir` stops pip from writing its download/wheel cache at all,
# so nothing has to be purged afterwards to keep the layer small.
RUN pip install --no-cache-dir -r requirements.txt
|
||||||
|
# Run the repository's utils/codegen_tl2.py generator for the
# Llama3-8B-1.58-100B-tokens model with the given --BM / --BK / --bm values.
RUN python3 utils/codegen_tl2.py \
        --model Llama3-8B-1.58-100B-tokens \
        --BM 256,128,256,128 \
        --BK 96,96,96,96 \
        --bm 32,32,32,32
|
||||||
|
# Configure the CMake build tree in ./build, selecting clang/clang++ as the
# compilers and switching the BITNET_X86_TL2 option on.
RUN cmake -B build \
        -DBITNET_X86_TL2=ON \
        -DCMAKE_C_COMPILER=clang \
        -DCMAKE_CXX_COMPILER=clang++
|
||||||
|
# Build only the llama-cli target from the configured ./build tree.
RUN cmake --build build \
        --config Release \
        --target llama-cli
|
||||||
|
# Download the TQ2_0 GGUF model file from Hugging Face into the current working directory.
# The file's SHA-256 is checked by the sha256sum step that follows this instruction.
# NOTE(review): on BuildKit frontends that support it, `ADD --checksum=sha256:...` could
# fold the verification into this instruction — confirm the minimum builder version first.
ADD https://huggingface.co/brunopio/Llama3-8B-1.58-100B-tokens-GGUF/resolve/main/Llama3-8B-1.58-100B-tokens-TQ2_0.gguf .
|
||||||
|
# Verify the downloaded model against its expected SHA-256; the build fails on mismatch.
# The checksum line must separate digest and filename with TWO spaces (text mode);
# with a single space `sha256sum -c` rejects the line as improperly formatted.
RUN echo "2565559c82a1d03ecd1101f536c5e99418d07e55a88bd5e391ed734f6b3989ac  Llama3-8B-1.58-100B-tokens-TQ2_0.gguf" | sha256sum -c
|
||||||
|
# Default command (exec form): run run_inference.py, passing the downloaded
# model file via -m and a sample prompt via -p.
CMD ["python3", "run_inference.py", \
     "-m", "Llama3-8B-1.58-100B-tokens-TQ2_0.gguf", \
     "-p", "The sky is blue due to a phenomenon called"]
|
Loading…
Add table
Reference in a new issue