From b7f4a2537e0d6f36655755979d308de56c52cf53 Mon Sep 17 00:00:00 2001
From: kyy <b24053@hanmaceng.co.kr>
Date: Thu, 23 Oct 2025 17:51:10 +0900
Subject: [PATCH] DeepSeek-OCR-vllm: update INPUT_PATH & Dockerfile envs

---
 .gitignore                                    |  9 +++++
 .../DeepSeek-OCR-vllm/config.py               |  4 +--
 Dockerfile.vllm                               | 36 +++++++++----------
 3 files changed, 27 insertions(+), 22 deletions(-)
 create mode 100644 .gitignore
diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..54b53fd
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,9 @@
+# Cache directories
+.cache/
+__pycache__/
+
+# Output directory
+output/
+
+# PDF files
+*.pdf
diff --git a/DeepSeek-OCR-master/DeepSeek-OCR-vllm/config.py b/DeepSeek-OCR-master/DeepSeek-OCR-vllm/config.py
index 37e48a1..8954cbd 100644
--- a/DeepSeek-OCR-master/DeepSeek-OCR-vllm/config.py
+++ b/DeepSeek-OCR-master/DeepSeek-OCR-vllm/config.py
@@ -21,9 +21,7 @@ MODEL_PATH = 'deepseek-ai/DeepSeek-OCR' # change to your model path
 # .jpg, .png, .jpeg: run_dpsk_ocr_image.py; 
 # Omnidocbench images path: run_dpsk_ocr_eval_batch.py
 
-FILE_NAME='2025-27484-M21472.pdf'
-
-INPUT_PATH = f'/workspace/2025-27484-M21472.pdf' 
+INPUT_PATH = '/workspace/2018-0802140959-217049.pdf'  # change to your input file path
 OUTPUT_PATH = '/workspace/output/'
 
 PROMPT = '<image>\n<|grounding|>Convert the document to markdown.'
diff --git a/Dockerfile.vllm b/Dockerfile.vllm
index dac8525..745d230 100644
--- a/Dockerfile.vllm
+++ b/Dockerfile.vllm
@@ -1,41 +1,39 @@
 # PyTorch 2.6.0 + CUDA 12.6 + cuDNN9
 FROM pytorch/pytorch:2.6.0-cuda12.6-cudnn9-devel
 
-# 기본 환경 변수
+# Default environment variables for the build and the running container
 ENV DEBIAN_FRONTEND=noninteractive \
     HF_HOME=/workspace/.cache/huggingface \
     CUDA_HOME=/usr/local/cuda \
     LD_LIBRARY_PATH=/usr/local/cuda/lib64:${LD_LIBRARY_PATH} \
     PIP_DISABLE_PIP_VERSION_CHECK=1 \
-    PYTHONUNBUFFERED=1
+    PYTHONUNBUFFERED=1 \
+    TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas \
+    TORCH_CUDA_ARCH_LIST="8.0"
 
 WORKDIR /workspace
 
-# 필수 빌드 도구
+# Install the required build tools (apt lists are removed in the same layer)
 RUN apt-get update && apt-get install -y --no-install-recommends \
       git build-essential ninja-build \
     && rm -rf /var/lib/apt/lists/*
 
-# pip 툴업
-RUN python -m pip install -U pip setuptools wheel packaging ninja
+# Upgrade pip tooling; --no-cache-dir keeps pip's cache out of the image layer
+RUN python -m pip install --no-cache-dir -U pip setuptools wheel
 
-# (베이스 이미지에 torch 2.6.0이 이미 포함)
-# torchvision/torchaudio 버전을 보장하려면 아래 라인을 사용하세요.
-# cu126 인덱스가 없을 수 있으므로 실패해도 빌드가 계속되게 처리합니다.
-RUN pip install --no-cache-dir \
-      torchvision==0.21.0 torchaudio==2.6.0 \
-      --extra-index-url https://download.pytorch.org/whl/cu126 || \
-    echo "Skip reinstalling torchvision/torchaudio (fallback to base image)"
+# Remove any preinstalled copies (best effort), then reinstall pinned versions
+RUN pip uninstall -y vllm torch torchvision torchaudio triton flash-attn || true
+RUN pip install --no-cache-dir torch==2.6.0 torchvision==0.21.0 torchaudio==2.6.0
 
 # 프로젝트 의존성 설치
 COPY requirements.txt /tmp/requirements.txt
-RUN pip install --no-cache-dir -r /tmp/requirements.txt
+RUN pip install --no-cache-dir -r /tmp/requirements.txt
 
-# vLLM 0.8.5 고정 (CUDA 12.x용 wheel 자동 선택)
-RUN pip install --no-cache-dir vllm==0.8.5
+# Install the pinned vLLM release
+RUN pip install --no-cache-dir vllm==0.8.5
 
-# FlashAttention (CUDA 12.6에서 빌드)
-RUN pip install --no-cache-dir flash-attn==2.7.3 --no-build-isolation
+# Build FlashAttention from source: --no-binary forbids prebuilt wheels
+RUN pip install --no-cache-dir --no-build-isolation \
+      --no-binary=flash-attn flash-attn==2.7.3
 
-# 작업 디렉터리 유지
-WORKDIR /workspace
+WORKDIR /workspace