mirror of
https://github.com/Tencent/WeKnora.git
synced 2026-06-04 13:30:32 +08:00
- Bump base image in docker/Dockerfile.app from golang:1.24 to golang:1.26
to match `go 1.26` declared in go.mod (fixes CI build failure on
`go mod download`).
- Drop unused docreader components and their dependencies:
- Remove `docreader/ocr/` package (paddle/vlm/dummy backends are
unreferenced by the main flow; OCR/VLM is handled by the Go App).
- Remove `docreader/parser/storage.py` (dead code; image persistence
happens in the Go App via inline ImageRef bytes).
- Remove `docreader/scripts/download_deps.py` (PaddleOCR pre-download).
- Drop deps: paddleocr, paddlepaddle, openai, ollama, minio,
cos-python-sdk-v5, oss2, asyncio, pypdf2, markdown, mistletoe,
goose3, markdownify, pdfplumber, antiword, urllib3.
- Re-lock uv.lock: 145 -> 79 packages.
- Update docreader/README.md to reflect that OCR/VLM/storage are no
longer configured at the docreader level.
117 lines
3.6 KiB
Erlang
117 lines
3.6 KiB
Erlang
# Build stage
|
|
FROM golang:1.26-bookworm AS builder
|
|
|
|
WORKDIR /app
|
|
|
|
# 通过构建参数接收敏感信息
|
|
ARG GOPRIVATE_ARG
|
|
ARG GOPROXY_ARG
|
|
ARG GOSUMDB_ARG=off
|
|
ARG APK_MIRROR_ARG
|
|
|
|
# 设置Go环境变量
|
|
ENV GOPRIVATE=${GOPRIVATE_ARG}
|
|
ENV GOPROXY=${GOPROXY_ARG}
|
|
ENV GOSUMDB=${GOSUMDB_ARG}
|
|
|
|
# Install dependencies
|
|
RUN if [ -n "$APK_MIRROR_ARG" ]; then \
|
|
sed -i "s@deb.debian.org@${APK_MIRROR_ARG}@g" /etc/apt/sources.list.d/debian.sources; \
|
|
fi && \
|
|
apt-get update && \
|
|
apt-get install -y git build-essential libsqlite3-dev
|
|
|
|
# Install migrate tool
|
|
RUN go install -tags 'postgres' github.com/golang-migrate/migrate/v4/cmd/migrate@latest
|
|
|
|
# Copy go mod and sum files
|
|
COPY go.mod go.sum ./
|
|
RUN --mount=type=cache,target=/go/pkg/mod go mod download
|
|
COPY cmd/download cmd/download
|
|
RUN go run cmd/download/duckdb/duckdb.go
|
|
COPY . .
|
|
|
|
# Get version and commit info for build injection
|
|
ARG VERSION_ARG
|
|
ARG COMMIT_ID_ARG
|
|
ARG BUILD_TIME_ARG
|
|
ARG GO_VERSION_ARG
|
|
|
|
# Set build-time variables
|
|
ENV VERSION=${VERSION_ARG}
|
|
ENV COMMIT_ID=${COMMIT_ID_ARG}
|
|
ENV BUILD_TIME=${BUILD_TIME_ARG}
|
|
ENV GO_VERSION=${GO_VERSION_ARG}
|
|
|
|
# Build the application with version info
|
|
RUN --mount=type=cache,target=/go/pkg/mod make build-prod
|
|
RUN --mount=type=cache,target=/go/pkg/mod cp -r /go/pkg/mod/github.com/yanyiwu/ /app/yanyiwu/
|
|
|
|
# Final stage
|
|
FROM debian:12.12-slim
|
|
|
|
WORKDIR /app
|
|
|
|
ARG APK_MIRROR_ARG
|
|
|
|
# Create a non-root user first
|
|
RUN useradd -m -s /bin/bash appuser
|
|
|
|
# First, install ca-certificates without mirror to ensure HTTPS works
|
|
RUN apt-get update && \
|
|
apt-get install -y --no-install-recommends ca-certificates && \
|
|
rm -rf /var/lib/apt/lists/*
|
|
|
|
# Then switch to mirror if specified and install other packages
|
|
RUN if [ -n "$APK_MIRROR_ARG" ]; then \
|
|
sed -i "s@deb.debian.org@${APK_MIRROR_ARG}@g" /etc/apt/sources.list.d/debian.sources; \
|
|
fi && \
|
|
apt-get update && \
|
|
apt-get install -y --no-install-recommends \
|
|
build-essential postgresql-client default-mysql-client tzdata sed curl bash vim wget \
|
|
libsqlite3-0 \
|
|
python3 python3-pip python3-dev libffi-dev libssl-dev \
|
|
nodejs npm \
|
|
gosu \
|
|
ffmpeg && \
|
|
python3 -m pip install --break-system-packages --upgrade pip setuptools wheel && \
|
|
mkdir -p /home/appuser/.local/bin && \
|
|
curl -LsSf https://astral.sh/uv/install.sh | CARGO_HOME=/home/appuser/.cargo UV_INSTALL_DIR=/home/appuser/.local/bin sh && \
|
|
chown -R appuser:appuser /home/appuser && \
|
|
ln -sf /home/appuser/.local/bin/uvx /usr/local/bin/uvx && \
|
|
chmod +x /usr/local/bin/uvx && \
|
|
apt-get clean && \
|
|
rm -rf /var/lib/apt/lists/*
|
|
|
|
# Create data directories and set permissions
|
|
RUN mkdir -p /data/files && \
|
|
chown -R appuser:appuser /app /data/files
|
|
|
|
# Copy migrate tool from builder stage
|
|
COPY --from=builder /go/bin/migrate /usr/local/bin/
|
|
COPY --from=builder /app/yanyiwu/ /go/pkg/mod/github.com/yanyiwu/
|
|
|
|
# Copy the binary from the builder stage
|
|
COPY --from=builder /app/config ./config
|
|
COPY --from=builder /app/scripts ./scripts
|
|
COPY --from=builder /app/migrations ./migrations
|
|
COPY --from=builder /app/dataset/samples ./dataset/samples
|
|
COPY --from=builder /app/skills/preloaded ./skills/preloaded
|
|
# Keep a read-only backup so bind-mount cannot erase built-in skills
|
|
COPY --from=builder /app/skills/preloaded ./skills/_builtin
|
|
COPY --from=builder /root/.duckdb /home/appuser/.duckdb
|
|
COPY --from=builder /app/WeKnora .
|
|
|
|
# Copy and make entrypoint script executable
|
|
COPY --from=builder /app/scripts/docker-entrypoint.sh ./scripts/docker-entrypoint.sh
|
|
|
|
# Make scripts executable
|
|
RUN chmod +x ./scripts/*.sh
|
|
|
|
# Expose ports
|
|
EXPOSE 8080
|
|
|
|
|
|
ENTRYPOINT ["./scripts/docker-entrypoint.sh"]
|
|
CMD ["./WeKnora"]
|