Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
12 changes: 6 additions & 6 deletions .env.example
Original file line number Diff line number Diff line change
Expand Up @@ -37,7 +37,7 @@ EMBEDDING_MAX_SEQ_LENGTH=512
EMBEDDING_NORMALIZE=true
EMBEDDING_SHOW_PROGRESS=true
EMBEDDING_USE_PREFIXES=true
# (domyślnie w settings są spacje po dwukropku)
# (by default, set to "true" to improve multilingual embedding quality)
EMBEDDING_QUERY_PREFIX=query:
EMBEDDING_PASSAGE_PREFIX=passage:

Expand Down Expand Up @@ -99,14 +99,14 @@ MULTIHOP_ADAPTIVE_TOP_K=true
# LLM (provider selection + local Ollama)
# ─────────────────────────────────────────────────────────────────────────────
LLM_MODEL=Qwen/Qwen3-8B-Instruct
LLM_MODEL_NAME_OLLAMA=qwen3:14b
LLM_MODEL_NAME_OLLAMA=qwen3:8b
LLM_PROVIDER=ollama
OLLAMA_HOST=http://localhost:11434
# OLLAMA_MODELS_PATH (opcjonalne) – zostaw puste jeśli nie używasz
# OLLAMA_MODELS_PATH (optional) – leave blank if not needed
# OLLAMA_MODELS_PATH=E:\Models\Ollama\.ollama\models

# ─────────────────────────────────────────────────────────────────────────────
# LLM – parametry wspólne
# LLM – shared params
# ─────────────────────────────────────────────────────────────────────────────
LLM_MAX_NEW_TOKENS=16384
LLM_DEVICE=cuda
Expand All @@ -116,14 +116,14 @@ LLM_TOP_P=0.9
REPETITION_PENALTY=1.1

# ─────────────────────────────────────────────────────────────────────────────
# LLM (HTTP API – używane, gdy LLM_PROVIDER ≠ ollama)
# LLM (HTTP API – used when LLM_PROVIDER ≠ ollama)
# ─────────────────────────────────────────────────────────────────────────────
LLM_API_BASE_URL=https://dashscope-intl.aliyuncs.com/compatible-mode/v1
LLM_API_KEY=...
LLM_API_MODEL_NAME=qwen3-32b

# ─────────────────────────────────────────────────────────────────────────────
# vLLM (ignorowane, gdy LLM_PROVIDER=ollama)
# vLLM (ignored when LLM_PROVIDER=ollama)
# ─────────────────────────────────────────────────────────────────────────────
TENSOR_PARALLEL_SIZE=1
GPU_MEMORY_UTILIZATION=0.9
Expand Down
11 changes: 0 additions & 11 deletions Dockerfile
Original file line number Diff line number Diff line change
@@ -1,23 +1,17 @@
# Base image: Python 3.12, slim variant.
FROM python:3.12-slim

# Set the working directory; relative paths in later instructions resolve against /app.
WORKDIR /app

# Install system dependencies (compiler toolchain, download tools, git).
# --no-install-recommends keeps optional "recommended" packages out of the
# image, and the apt package lists are removed in the same layer so they are
# never persisted in it.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        curl \
        git \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Copy the project metadata (pyproject.toml and README.md) into the working directory.
COPY pyproject.toml README.md ./

# Install uv; the Python dependency step that follows runs `uv pip install`.
RUN pip install --no-cache-dir uv

# Install Python dependencies
RUN uv pip install --system --no-cache \
wikiextractor \
qdrant-client \
Expand All @@ -40,20 +34,15 @@ RUN uv pip install --system --no-cache \
click \
python-dotenv

# Download the NLTK 'punkt' data at build time so it is already present in the image.
RUN python -c "import nltk; nltk.download('punkt')"

# Bring the application into the image: the src, configs, and scripts
# directories, each copied to the same name under the working directory.
COPY src ./src
COPY configs ./configs
COPY scripts ./scripts

# Pre-create the data and log directories (one path per line for easy diffs).
RUN mkdir -p \
        /app/data/raw \
        /app/data/processed \
        /app/data/index \
        /app/logs

# Runtime environment variables.
#   PYTHONUNBUFFERED=1  disable Python's stdout/stderr buffering so output
#                       shows up in container logs immediately.
#   PYTHONPATH=/app     make modules under /app importable.
# PYTHONPATH is set explicitly instead of appending "$PYTHONPATH": that
# variable is not defined earlier in this Dockerfile, so the expansion would
# leave a trailing ':' (an empty path entry) and trigger BuildKit's
# UndefinedVar build check.
ENV PYTHONUNBUFFERED=1 \
    PYTHONPATH=/app

# Default command: print a readiness message and exit. This is a placeholder;
# pass a different command at `docker run` to do actual work.
CMD ["python", "-c", "print('RAGx container ready')"]
Loading