synthetic-data-generator / docker /.env.docker.template
daqc's picture
Add Ollama hardware configuration options
ff96bee
# =============================================================================
# DOCKER CONFIGURATION ONLY - FULL SETUP (APP + OLLAMA + ARGILLA)
# =============================================================================
# Note: Before building:
# 1. Copy this template to the root directory: cp docker/.env.docker.template .env
# 2. Comment/uncomment the sections you want to use (OLLAMA and/or ARGILLA)
# 3. Then build and run with the appropriate docker compose command
# Hugging Face token with read/write permissions.
# Replace the placeholder below with your own token; do not commit the filled-in .env.
HF_TOKEN=your_token_here
# -----------------------------------------------------------------------------
# GENERATION SETTINGS
# -----------------------------------------------------------------------------
# NOTE(review): judging by the names, these are presumably the cap on tokens per
# generation, the cap on rows per dataset, and the default generation batch
# size; confirm against the application before relying on this.
MAX_NUM_TOKENS=2048
MAX_NUM_ROWS=1000
DEFAULT_BATCH_SIZE=5
# -----------------------------------------------------------------------------
# OLLAMA DOCKER CONFIGURATION
# -----------------------------------------------------------------------------
OLLAMA_BASE_URL=http://ollama:11434
# Ollama hardware variant: latest (for CPU/NVIDIA), rocm (for AMD).
# Keep this comment on its own line: env-file readers that do not strip inline
# comments (e.g. `docker run --env-file`) would make the text part of the value.
OLLAMA_HARDWARE=latest
# Enable only one model group at a time (comment out the other).
# LLAMA 3.2
MODEL=llama3.2:1b
TOKENIZER_ID=meta-llama/Llama-3.2-1B-Instruct
MAGPIE_PRE_QUERY_TEMPLATE=llama3
# DEEPSEEK R1
# NOTE(review): MODEL is presumably passed to Ollama, so it uses the Ollama tag
# format like the Llama entry above, while TOKENIZER_ID stays a Hugging Face
# repo id; confirm that deepseek-r1:1.5b is the intended model.
#MODEL=deepseek-r1:1.5b
#TOKENIZER_ID=deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
#MAGPIE_PRE_QUERY_TEMPLATE="<|begin▁of▁sentence|>User: "
# -----------------------------------------------------------------------------
# ARGILLA DOCKER CONFIGURATION (persistent data)
# -----------------------------------------------------------------------------
ARGILLA_API_URL=http://argilla:6900
# NOTE(review): the username, password and API key below look like default
# local-development credentials; change them before exposing the Argilla
# service beyond your own machine.
ARGILLA_USERNAME=admin
ARGILLA_PASSWORD=admin1234
ARGILLA_API_KEY=admin.1234
ARGILLA_REINDEX_DATASET=1