This commit is contained in:
hiondal
2025-06-15 13:52:26 +00:00
commit 6a5c411800
53 changed files with 15785 additions and 0 deletions
+100
View File
@@ -0,0 +1,100 @@
# deployment/container/Dockerfile
# Application image for the Poetry-based Vector DB API service
# (variant that resolves the PVC mount conflict).
# Inherits from the base image, which already ships the Poetry environment.
ARG BASE_IMAGE=vector-api-base:latest
FROM ${BASE_IMAGE}

# Image metadata, declared in a single LABEL instruction.
LABEL maintainer="admin@example.com" \
      version="1.0.2" \
      description="Vector DB API Service with Poetry - PVC Mount Fixed"
# Runtime environment. Poetry keeps its virtualenvs and cache under /opt/pypoetry.
# Poetry maps environment variables as POETRY_<SECTION>_<KEY>, so the in-project
# switch must be spelled POETRY_VIRTUALENVS_IN_PROJECT; the previous name
# (POETRY_VENV_IN_PROJECT) is not a setting Poetry recognises.
ENV HOME=/home/appuser \
    PYTHONDONTWRITEBYTECODE=1 \
    PYTHONUNBUFFERED=1 \
    POETRY_VIRTUALENVS_IN_PROJECT=false \
    POETRY_VIRTUALENVS_CREATE=true \
    POETRY_VIRTUALENVS_PATH=/opt/pypoetry/venvs \
    POETRY_CACHE_DIR=/opt/pypoetry/cache \
    POETRY_NO_INTERACTION=1 \
    PATH="/home/appuser/.local/bin:/opt/pypoetry/venvs/vector-api/bin:/usr/local/bin:/usr/bin:/bin"
# Switch to root for copying files and adjusting ownership.
USER root

# Poetry project metadata (dependency definitions). The trailing glob makes
# poetry.lock optional in the build context.
COPY pyproject.toml poetry.lock* /app/

# Application source code.
COPY app/ /app/app/

# Install the runtime dependencies; the virtualenv is created under /opt/pypoetry.
# `--only main` replaces `--no-dev`: that flag was deprecated in Poetry 1.2 and is
# no longer accepted by Poetry 2.x, and the base image installs Poetry without
# pinning a version. Note that `--only main` also skips any other non-optional
# dependency groups, which is the intended behaviour for a runtime image.
# Steps: re-apply Poetry settings, print them, install, list a few installed
# packages, show the virtualenv location, then drop the download cache and /tmp.
RUN cd /app && \
    poetry config virtualenvs.in-project false && \
    poetry config virtualenvs.create true && \
    poetry config virtualenvs.path /opt/pypoetry/venvs && \
    poetry config cache-dir /opt/pypoetry/cache && \
    echo "🔧 Poetry 설정 확인:" && \
    poetry config --list && \
    echo "📦 의존성 설치 시작..." && \
    poetry install --only main --no-interaction && \
    echo "✅ 의존성 설치 완료" && \
    poetry show | head -10 && \
    poetry env info && \
    rm -rf "$POETRY_CACHE_DIR/cache" && \
    rm -rf /tmp/*
# Create the data, log and vector-DB directories and set mode 755 on each
# (recursively). `set -e` aborts the build on the first failing command.
RUN set -e; \
    for dir in /app/data /app/logs /app/vectordb; do \
        mkdir -p "$dir"; \
        chmod -R 755 "$dir"; \
    done
# Hand /app and the Poetry directories over to appuser when that account exists.
# The original test used `&>`, which is a bash-only redirect. RUN executes with
# /bin/sh, where `id appuser &>/dev/null` is parsed as "start id in the
# background, then run an empty command redirected to /dev/null" and therefore
# always succeeds. The POSIX form below makes the existence check effective.
# The two chown calls are chained so a failure stops the build.
RUN if id "appuser" >/dev/null 2>&1; then \
        chown -R appuser:appuser /app && \
        chown -R appuser:appuser /opt/pypoetry; \
    else \
        echo "appuser가 없어서 root로 실행됩니다"; \
    fi
# Startup script: prints Python/Poetry diagnostics, runs a dotenv import test,
# then exec's the application through `poetry run`.
# Written with an inline COPY heredoc so that the file content, its mode (755)
# and its owner (appuser) are all set by one instruction. The quoted delimiter
# keeps $(...) in the script from being expanded at build time.
COPY --chown=appuser:appuser --chmod=755 <<'EOF' /app/start.sh
#!/bin/bash
echo "🚀 Vector API 시작 중..."
echo "📍 현재 디렉토리: $(pwd)"
echo "🐍 Python 위치: $(which python)"
echo "📦 Poetry 위치: $(which poetry)"
echo "🔧 Poetry 가상환경 정보:"
poetry env info
echo "📋 설치된 패키지 (일부):"
poetry show | head -5
echo "🔍 dotenv 모듈 테스트:"
poetry run python -c "from dotenv import load_dotenv; print('✅ dotenv 모듈 정상 로드')"
echo "🚀 애플리케이션 실행..."
exec poetry run python app/main.py
EOF
# Health check: probe the running server over HTTP.
# The previous check imported app.main in a brand-new interpreter on every
# interval; it never contacted the serving process, so it could pass while the
# server was down, and it repeated the application's import work each time.
# Port 8000 matches EXPOSE below; /health is the path the Kubernetes liveness
# and readiness probes in the deployment manifest already use.
# urlopen raises on connection errors and on HTTP 4xx/5xx, giving a non-zero exit.
HEALTHCHECK --interval=30s --timeout=15s --start-period=60s --retries=3 \
    CMD python -c "import urllib.request; urllib.request.urlopen('http://127.0.0.1:8000/health', timeout=10)" || exit 1
# Working directory for the running container.
WORKDIR /app

# Document the port the service is published on.
EXPOSE 8000

# Run as the unprivileged application user.
USER appuser

# Start the application through the startup script.
CMD ["/app/start.sh"]
+138
View File
@@ -0,0 +1,138 @@
# deployment/container/Dockerfile-base
# Base image for the Poetry-based Vector DB API; Poetry state lives under the
# application user's home directory.
# The tag is pinned to the Debian bookworm variant: the python3.11* apt packages
# installed further down in this file come from that release's archive, while
# the floating `3.11-slim` tag tracks whichever Debian release is current.
FROM python:3.11-slim-bookworm

# Image metadata.
LABEL description="Vector DB API Base Image with Poetry - Home Directory" \
      version="poetry-home-v1.0" \
      maintainer="admin@example.com"
# Build/runtime environment. Poetry virtualenvs and cache are placed under
# /home/appuser/.cache; model caches are placed under /app/.cache.
# Poetry maps environment variables as POETRY_<SECTION>_<KEY>, so the in-project
# switch must be spelled POETRY_VIRTUALENVS_IN_PROJECT; the previous name
# (POETRY_VENV_IN_PROJECT) is not a setting Poetry recognises.
ENV PYTHONDONTWRITEBYTECODE=1 \
    PYTHONUNBUFFERED=1 \
    DEBIAN_FRONTEND=noninteractive \
    PIP_NO_CACHE_DIR=1 \
    PIP_DISABLE_PIP_VERSION_CHECK=1 \
    POETRY_NO_INTERACTION=1 \
    POETRY_VIRTUALENVS_IN_PROJECT=false \
    POETRY_VIRTUALENVS_CREATE=true \
    POETRY_VIRTUALENVS_PATH=/home/appuser/.cache/pypoetry/venvs \
    POETRY_CACHE_DIR=/home/appuser/.cache/pypoetry/cache \
    HF_HUB_CACHE=/app/.cache/huggingface \
    TRANSFORMERS_CACHE=/app/.cache/transformers \
    SENTENCE_TRANSFORMERS_HOME=/app/.cache/sentence_transformers
# System packages (listed alphabetically, one per line, for easy diffing).
# The apt lists are removed in the same layer that created them.
RUN apt-get update \
 && apt-get install -y --no-install-recommends \
        bc \
        build-essential \
        ca-certificates \
        curl \
        g++ \
        gcc \
        git \
        lsb-release \
        python3-dev \
        python3.11 \
        python3.11-dev \
        python3.11-distutils \
        python3.11-venv \
        sudo \
        wget \
 && rm -rf /var/lib/apt/lists/* \
 && apt-get clean
# Upgrade the Python packaging toolchain.
RUN python3.11 -m pip install --upgrade --no-cache-dir \
        pip \
        setuptools \
        wheel
# Create the non-root account (before Poetry is installed).
# UID and GID are fixed at 1000 because the Kubernetes Deployment runs the
# container with runAsUser/runAsGroup 1000 and its init container chowns the
# data volume to 1000:1000. `useradd -r` allocates an id from the system range
# instead, so the files owned by appuser would not belong to the runtime user.
# The home directory is created explicitly below, hence --no-create-home.
RUN groupadd --gid 1000 appuser && \
    useradd --uid 1000 --gid appuser \
            --home-dir /home/appuser --no-create-home \
            --shell /bin/bash --no-log-init appuser && \
    mkdir -p /home/appuser && \
    chown -R appuser:appuser /home/appuser

# Poetry virtualenv and cache directories inside the home directory.
RUN mkdir -p /home/appuser/.cache/pypoetry/venvs \
             /home/appuser/.cache/pypoetry/cache && \
    chown -R appuser:appuser /home/appuser/.cache && \
    chmod -R 755 /home/appuser/.cache
# Install Poetry as appuser, into appuser's home directory.
USER appuser
ENV PATH="/home/appuser/.local/bin:$PATH"

# Run the pipeline under bash with pipefail, and let curl fail on HTTP errors
# (-f): with plain `sh -c`, a failed download handed an empty script to Python,
# which exited 0 and let the build continue without Poetry.
# NOTE(review): no Poetry version is requested, so the installer fetches the
# latest release; consider pinning one for reproducible builds.
RUN ["/bin/bash", "-o", "pipefail", "-c", "curl -fsSL https://install.python-poetry.org | python3.11 -"]

# Make the launcher executable and expose it system-wide via /usr/local/bin
# (needs root).
USER root
RUN chmod +x /home/appuser/.local/bin/poetry && \
    ln -sf /home/appuser/.local/bin/poetry /usr/local/bin/poetry && \
    chown appuser:appuser /home/appuser/.local/bin/poetry
# Back to appuser: point Poetry at the home-directory virtualenv and cache
# locations, then print the version, the effective configuration and the
# launcher location as a build-time sanity check.
USER appuser
RUN poetry config virtualenvs.in-project false \
 && poetry config virtualenvs.create true \
 && poetry config virtualenvs.path /home/appuser/.cache/pypoetry/venvs \
 && poetry config cache-dir /home/appuser/.cache/pypoetry/cache \
 && poetry --version \
 && poetry config --list \
 && ls -la /home/appuser/.local/bin/poetry \
 && which poetry
# Working directory; WORKDIR creates /app, which is then handed to appuser.
WORKDIR /app
USER root
RUN chown -R appuser:appuser /app

# Copy the setup script with its owner and mode set at copy time, instead of
# duplicating the file in an extra chmod/chown layer.
COPY --chown=appuser:appuser --chmod=755 setup.sh /app/setup.sh

# Run the setup script as appuser. WORKDIR is already /app, so no `cd` is
# needed; DEBIAN_FRONTEND is passed inline so the step does not depend on the
# image-wide ENV.
USER appuser
RUN DEBIAN_FRONTEND=noninteractive \
    ./setup.sh --skip-poetry-install --skip-python311-check --force-reinstall
# As root: create the model-cache and data directories, set their modes,
# give /app and the Poetry cache tree to appuser, and empty the temp directories.
USER root
RUN mkdir -p \
        /app/.cache/huggingface \
        /app/.cache/transformers \
        /app/.cache/sentence_transformers \
        /app/vectordb \
        /app/data \
        /app/logs \
 && chmod -R 755 /app/.cache /app/vectordb /app/data /app/logs \
 && chown -R appuser:appuser /app /home/appuser/.cache \
 && chmod -R 755 /home/appuser/.cache \
 && rm -rf /tmp/* /var/tmp/*
# Document the service port.
EXPOSE 8000

# Simple health check: Poetry is callable and its virtualenv path is configured.
# The commands run directly because the container's user is already appuser
# (see USER below); wrapping them in `su -c ... appuser` makes su ask for a
# password when it is invoked by a non-root user, so the check could not pass.
HEALTHCHECK --interval=30s --timeout=10s --start-period=60s --retries=3 \
    CMD poetry --version && poetry config virtualenvs.path || exit 1

# Final runtime user.
USER appuser

# Default command.
CMD ["poetry", "--version"]
+63
View File
@@ -0,0 +1,63 @@
# ConfigMap with the non-secret settings of the vector-api service.
apiVersion: v1
kind: ConfigMap
metadata:
  name: vector-api-config
data:
  # Application settings (existing, unchanged)
  APP_TITLE: "음식점 Vector DB 구축 서비스"
  APP_VERSION: "1.0.0"
  APP_DESCRIPTION: "소상공인을 위한 AI 기반 경쟁업체 분석 및 액션 추천 시스템"

  # Server settings (existing, unchanged)
  HOST: "0.0.0.0"
  PORT: "8000"
  LOG_LEVEL: "debug"  # switched to debug for troubleshooting

  # Restaurant API (in-cluster service; existing, unchanged)
  RESTAURANT_API_HOST: "restaurant-api-service"
  RESTAURANT_API_PORT: "80"

  # Review API (in-cluster service; existing, unchanged)
  REVIEW_API_HOST: "kakao-review-api-service"
  REVIEW_API_PORT: "80"

  # Claude API (existing, unchanged)
  CLAUDE_MODEL: "claude-sonnet-4-20250514"

  # Vector DB (existing, unchanged)
  VECTOR_DB_PATH: "/app/vectordb"
  VECTOR_DB_COLLECTION: "restaurant_reviews"
  EMBEDDING_MODEL: "sentence-transformers/all-MiniLM-L6-v2"

  # Data collection (existing, unchanged)
  MAX_RESTAURANTS_PER_CATEGORY: "50"
  MAX_REVIEWS_PER_RESTAURANT: "100"
  REQUEST_DELAY: "0.1"
  REQUEST_TIMEOUT: "600"

  # ChromaDB settings (added)
  # NOTE(review): recent ChromaDB releases appear to treat "duckdb+parquet" as a
  # legacy setting — confirm against the chromadb version the app pins.
  CHROMA_DB_IMPL: "duckdb+parquet"  # use DuckDB instead of SQLite
  ALLOW_RESET: "True"
  ANONYMIZED_TELEMETRY: "False"

  # Python runtime flags (added)
  PYTHONUNBUFFERED: "1"
  PYTHONDONTWRITEBYTECODE: "1"

  # Model cache directories (added)
  HF_HUB_CACHE: "/app/.cache/huggingface"
  TRANSFORMERS_CACHE: "/app/.cache/transformers"

  # FastAPI (added)
  FASTAPI_ENV: "production"

  # Uvicorn (added)
  UVICORN_HOST: "0.0.0.0"
  UVICORN_PORT: "8000"
  UVICORN_LOG_LEVEL: "debug"
  UVICORN_ACCESS_LOG: "true"

  # Timeouts (added)
  STARTUP_TIMEOUT: "300"  # 5 minutes
  SHUTDOWN_TIMEOUT: "30"  # 30 seconds
+164
View File
@@ -0,0 +1,164 @@
# deployment/manifests/deployment.yaml.fixed
# Deployment of the vector-api service: one replica, backed by the
# vector-db-pvc volume mounted at /app/vectordb.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: vector-api
  labels:
    app: vector-api
spec:
  replicas: 1
  # The pod mounts vector-db-pvc, which is ReadWriteOnce. With the default
  # RollingUpdate strategy the replacement pod starts before the old one stops,
  # and the preferred anti-affinity below steers it to a different node, where
  # the volume cannot be attached — the rollout then stalls. Recreate stops the
  # old pod first so the volume is free for the new one.
  strategy:
    type: Recreate
  selector:
    matchLabels:
      app: vector-api
  template:
    metadata:
      labels:
        app: vector-api
    spec:
      # Init container that fixes ownership and mode of the data volume so the
      # non-root application user (1000:1000) can write to it.
      initContainers:
        - name: volume-permissions
          image: busybox:1.35
          command:
            - /bin/sh
            - -c
            - |
              echo "=== 볼륨 권한 설정 시작 ==="
              mkdir -p /app/vectordb
              chown -R 1000:1000 /app/vectordb
              chmod -R 755 /app/vectordb
              echo "=== 볼륨 권한 설정 완료 ==="
          volumeMounts:
            - name: vector-db-storage
              mountPath: /app/vectordb
          securityContext:
            runAsUser: 0  # chown requires root
      containers:
        - name: vector-api
          image: acrdigitalgarage03.azurecr.io/vector-api:latest
          imagePullPolicy: Always
          ports:
            - containerPort: 8000
          # Security context: run as the unprivileged 1000:1000 user.
          securityContext:
            runAsNonRoot: true
            runAsUser: 1000
            runAsGroup: 1000
            allowPrivilegeEscalation: false
            readOnlyRootFilesystem: false
          # Resource requests and limits.
          resources:
            requests:
              memory: "4Gi"
              cpu: "1000m"
            limits:
              memory: "8Gi"
              cpu: "2000m"
          # Health probes against the application's /health endpoint.
          livenessProbe:
            httpGet:
              path: /health
              port: 8000
            initialDelaySeconds: 120
            periodSeconds: 30
            timeoutSeconds: 15
            failureThreshold: 3
          readinessProbe:
            httpGet:
              path: /health
              port: 8000
            initialDelaySeconds: 60
            periodSeconds: 10
            timeoutSeconds: 10
            failureThreshold: 3
          # Persistent vector-DB storage.
          volumeMounts:
            - name: vector-db-storage
              mountPath: /app/vectordb
          # Import every key of the ConfigMap as an environment variable.
          envFrom:
            - configMapRef:
                name: vector-api-config
          # Explicit variables (authentication fields removed). Entries listed
          # here take precedence over same-named keys imported through envFrom;
          # e.g. LOG_LEVEL is "info" here while the ConfigMap sets "debug".
          env:
            - name: PYTHONUNBUFFERED
              value: "1"
            - name: PYTHONDONTWRITEBYTECODE
              value: "1"
            # ChromaDB basic settings (authentication fields removed)
            - name: ANONYMIZED_TELEMETRY
              value: "False"
            - name: CHROMA_DB_IMPL
              value: "duckdb+parquet"
            - name: ALLOW_RESET
              value: "True"
            # Log level
            - name: LOG_LEVEL
              value: "info"
            # Claude API: the key comes from the Secret, the model name from
            # the ConfigMap.
            - name: CLAUDE_API_KEY
              valueFrom:
                secretKeyRef:
                  name: vector-api-secret
                  key: CLAUDE_API_KEY
            - name: CLAUDE_MODEL
              valueFrom:
                configMapKeyRef:
                  name: vector-api-config
                  key: CLAUDE_MODEL
            # Other settings read from the ConfigMap
            - name: APP_TITLE
              valueFrom:
                configMapKeyRef:
                  name: vector-api-config
                  key: APP_TITLE
            - name: APP_VERSION
              valueFrom:
                configMapKeyRef:
                  name: vector-api-config
                  key: APP_VERSION
      # Volumes
      volumes:
        - name: vector-db-storage
          persistentVolumeClaim:
            claimName: vector-db-pvc
      # Registry pull secret
      imagePullSecrets:
        - name: acr-secret
      # Node selection and placement
      nodeSelector:
        agentpool: aipool
      tolerations:
        - key: "dedicated"
          operator: "Equal"
          value: "aipool"
          effect: "NoSchedule"
      affinity:
        podAntiAffinity:
          preferredDuringSchedulingIgnoredDuringExecution:
            - weight: 100
              podAffinityTerm:
                labelSelector:
                  matchExpressions:
                    - key: app
                      operator: In
                      values:
                        - vector-api
                topologyKey: kubernetes.io/hostname
      restartPolicy: Always
      dnsPolicy: ClusterFirst
+39
View File
@@ -0,0 +1,39 @@
# deployment/manifests/ingress.yaml
# NGINX Ingress that routes all paths of the host to vector-api-service:80.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: vector-api-ingress
  annotations:
    # No rewrite-target annotation: the rule forwards "/" as-is. A
    # `rewrite-target: /` without a regex capture group makes ingress-nginx
    # (0.22+) rewrite every request path to "/", so routes such as /health
    # would never reach the backend with their original path.
    nginx.ingress.kubernetes.io/ssl-redirect: "false"
    nginx.ingress.kubernetes.io/proxy-body-size: "10m"
    # Long timeouts to allow for the time it takes to build the vector DB
    nginx.ingress.kubernetes.io/proxy-read-timeout: "1800"
    nginx.ingress.kubernetes.io/proxy-send-timeout: "1800"
    nginx.ingress.kubernetes.io/client-body-timeout: "1800"
    nginx.ingress.kubernetes.io/proxy-connect-timeout: "60"
    # CORS
    nginx.ingress.kubernetes.io/enable-cors: "true"
    nginx.ingress.kubernetes.io/cors-allow-origin: "*"
    nginx.ingress.kubernetes.io/cors-allow-methods: "GET, POST, OPTIONS"
    nginx.ingress.kubernetes.io/cors-allow-headers: "DNT,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Range,Authorization"
spec:
  ingressClassName: nginx
  rules:
    # Adjust the host name to the target environment
    - host: vector-api.20.249.191.180.nip.io
      http:
        paths:
          - path: /
            pathType: Prefix
            backend:
              service:
                name: vector-api-service
                port:
                  number: 80
  # TLS (uncomment when HTTPS is required)
  # tls:
  #   - hosts:
  #       - vector-api.example.com
  #     secretName: vector-api-tls
+18
View File
@@ -0,0 +1,18 @@
# deployment/manifests/pvc.yaml
# 10Gi ReadWriteOnce claim that backs the vector DB directory.
apiVersion: v1
kind: PersistentVolumeClaim
metadata:
  name: vector-db-pvc
  labels:
    app: vector-api
    component: storage
spec:
  storageClassName: managed
  accessModes:
    - ReadWriteOnce
  resources:
    requests:
      storage: 10Gi
  # Optional: bind to a specific PersistentVolume
  # volumeName: vector-db-pv
+11
View File
@@ -0,0 +1,11 @@
# deployment/manifests/secret.yaml
# Secret that provides CLAUDE_API_KEY to the vector-api Deployment.
#
# SECURITY: never commit a real key to this file. An earlier revision of this
# manifest contained a live key (in plain text and base64-encoded); that key
# must be treated as compromised and rotated.
#
# Supply the real value at deploy time instead, for example:
#   kubectl create secret generic vector-api-secret \
#     --from-literal=CLAUDE_API_KEY="$CLAUDE_API_KEY"
apiVersion: v1
kind: Secret
metadata:
  name: vector-api-secret
type: Opaque
stringData:
  # Placeholder only — replace before applying. stringData takes the plain
  # value; Kubernetes performs the base64 encoding itself.
  CLAUDE_API_KEY: "REPLACE_WITH_CLAUDE_API_KEY"
+17
View File
@@ -0,0 +1,17 @@
# deployment/manifests/service.yaml
# ClusterIP Service exposing the vector-api pods: port 80 -> container port 8000.
apiVersion: v1
kind: Service
metadata:
  name: vector-api-service
  labels:
    app: vector-api
spec:
  type: ClusterIP
  selector:
    app: vector-api
  ports:
    - name: http
      protocol: TCP
      port: 80
      targetPort: 8000