Spaces:
Paused
Paused
Update Dockerfile
Browse files- Dockerfile +7 -34
Dockerfile
CHANGED
|
@@ -83,38 +83,18 @@ RUN pip install --index-url https://download.pytorch.org/whl/cu128 \
|
|
| 83 |
# ---------------- Toolchain, Triton, FA2 (sem bnb) ----------------
|
| 84 |
RUN pip install packaging ninja cmake pybind11 scikit-build cython hf_transfer numpy==1.24.4
|
| 85 |
|
| 86 |
-
|
| 87 |
-
|
| 88 |
-
# ---------------- Toolchain base ----------------
|
| 89 |
-
RUN pip install packaging ninja cmake pybind11 scikit-build cython hf_transfer numpy==1.24.4
|
| 90 |
-
|
| 91 |
-
# ---------------- Instalação via wheels (HF Hub) ----------------
|
| 92 |
-
# Triton, Apex e Q8 pré-compilados (Python 3.10, manylinux x86_64)
|
| 93 |
-
# Use sempre --no-cache-dir e --no-build-isolation para evitar recompilar
|
| 94 |
RUN pip uninstall -y triton || true && \
|
| 95 |
-
pip install
|
| 96 |
-
https://huggingface.co/carlex3321/aduc-sdr/resolve/main/triton-3.5.0%2Bgit51021fb2-cp310-cp310-linux_x86_64.whl && \
|
| 97 |
-
pip install --no-cache-dir --no-build-isolation \
|
| 98 |
-
https://huggingface.co/carlex3321/aduc-sdr/resolve/main/apex-0.1-cp310-cp310-linux_x86_64.whl
|
| 99 |
-
#pip install --no-cache-dir --no-build-isolation \
|
| 100 |
-
# https://huggingface.co/carlex3321/aduc-sdr/resolve/main/q8_kernels-0.0.5-cp310-cp310-linux_x86_64.whl
|
| 101 |
-
|
| 102 |
-
# ---------------- FlashAttention 2.8.x ----------------
|
| 103 |
-
# Mantém fallback em cascata caso a versão mais nova falhe
|
| 104 |
-
RUN pip install --no-cache-dir flash-attn==2.8.3 --no-build-isolation || \
|
| 105 |
-
pip install --no-cache-dir flash-attn==2.8.2 --no-build-isolation || \
|
| 106 |
-
pip install --no-cache-dir flash-attn==2.8.1 --no-build-isolation || \
|
| 107 |
-
pip install --no-cache-dir flash-attn==2.8.0.post2 --no-build-isolation
|
| 108 |
-
|
| 109 |
|
| 110 |
# FlashAttention 2.8.x
|
| 111 |
-
RUN pip install flash-attn==2.8.3 --no-build-isolation || \
|
| 112 |
-
pip install flash-attn==2.8.2 --no-build-isolation || \
|
| 113 |
-
pip install flash-attn==2.8.1 --no-build-isolation || \
|
| 114 |
-
pip install flash-attn==2.8.0.post2 --no-build-isolation
|
| 115 |
|
| 116 |
# Diffusers/Transformers estáveis (sem dev)
|
| 117 |
-
RUN pip install --no-cache-dir transformers==4.44.2 accelerate==0.34.2 omegaconf==2.3.0
|
| 118 |
|
| 119 |
# Opcional: seu fork de otimizações
|
| 120 |
RUN pip install -U git+https://github.com/carlex22/diffusers-aduc-sdr
|
|
@@ -138,12 +118,6 @@ COPY requirements.txt ./requirements.txt
|
|
| 138 |
RUN pip install --no-cache-dir -r requirements.txt
|
| 139 |
|
| 140 |
|
| 141 |
-
RUN apt-get update && apt-get install -y \
|
| 142 |
-
build-essential clang lld cmake ninja-build git python3-dev \
|
| 143 |
-
&& rm -rf /var/lib/apt/lists/*
|
| 144 |
-
ENV CC=clang CXX=clang++ LD=lld
|
| 145 |
-
|
| 146 |
-
|
| 147 |
RUN pip install --upgrade bitsandbytes
|
| 148 |
|
| 149 |
# Scripts e configs
|
|
@@ -170,7 +144,6 @@ ENV TRANSFORMERS_CACHE=/data/.cache/transformers
|
|
| 170 |
ENV DIFFUSERS_CACHE=/data/.cache/diffusers
|
| 171 |
|
| 172 |
|
| 173 |
-
|
| 174 |
# ---------------- Entry ----------------
|
| 175 |
ENTRYPOINT ["./start.sh"]
|
| 176 |
CMD ["gradio"]
|
|
|
|
| 83 |
# ---------------- Toolchain, Triton, FA2 (sem bnb) ----------------
|
| 84 |
RUN pip install packaging ninja cmake pybind11 scikit-build cython hf_transfer numpy==1.24.4
|
| 85 |
|
| 86 |
+
# Triton 3.x (sem triton.ops)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 87 |
RUN pip uninstall -y triton || true && \
|
| 88 |
+
pip install -v --no-build-isolation triton==3.4.0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 89 |
|
| 90 |
# FlashAttention 2.8.x
|
| 91 |
+
#RUN pip install flash-attn==2.8.3 --no-build-isolation || \
|
| 92 |
+
# pip install flash-attn==2.8.2 --no-build-isolation || \
|
| 93 |
+
# pip install flash-attn==2.8.1 --no-build-isolation || \
|
| 94 |
+
# pip install flash-attn==2.8.0.post2 --no-build-isolation
|
| 95 |
|
| 96 |
# Diffusers/Transformers estáveis (sem dev)
|
| 97 |
+
RUN pip install --no-cache-dir diffusers==0.31.0 transformers==4.44.2 accelerate==0.34.2 omegaconf==2.3.0
|
| 98 |
|
| 99 |
# Opcional: seu fork de otimizações
|
| 100 |
RUN pip install -U git+https://github.com/carlex22/diffusers-aduc-sdr
|
|
|
|
| 118 |
RUN pip install --no-cache-dir -r requirements.txt
|
| 119 |
|
| 120 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 121 |
RUN pip install --upgrade bitsandbytes
|
| 122 |
|
| 123 |
# Scripts e configs
|
|
|
|
| 144 |
ENV DIFFUSERS_CACHE=/data/.cache/diffusers
|
| 145 |
|
| 146 |
|
|
|
|
| 147 |
# ---------------- Entry ----------------
|
| 148 |
ENTRYPOINT ["./start.sh"]
|
| 149 |
CMD ["gradio"]
|