ia-test/Dockerfile

# Variant 1 (current base image).
# The image tag is a build argument so a build can be pinned to a specific
# release for reproducibility, e.g. `docker build --build-arg LOCALAI_TAG=<tag> .`.
# The default keeps the previous behaviour of tracking `latest`.
ARG LOCALAI_TAG=latest
FROM quay.io/go-skynet/local-ai:${LOCALAI_TAG}

# (optional) if the base image does not ship curl:
# RUN apk add --no-cache curl || (apt-get update && apt-get install -y curl ca-certificates)

# Default settings, available to the following build steps and to the running
# container. CONTEXT_SIZE and THREADS are also interpolated into the generated
# model YAML at build time.
ENV CONTEXT_SIZE="1024" \
    DEBUG="false" \
    MODELS_PATH="/models" \
    THREADS="2"

# Create the models directory and download a small chat model
# (TinyLlama 1.1B, Q4 quantization) at BUILD time, so the file is baked into
# the image and no network access is needed for it at runtime.
#
# --fail makes curl exit non-zero on an HTTP error (404, 401, ...) instead of
# saving the server's error page as the .gguf file, which would otherwise give
# a "successful" build containing an unusable model. --retry covers transient
# network failures.
#
# NOTE(review): Hugging Face file downloads normally use a URL of the form
# /<owner>/<repo>/resolve/<revision>/<file> - confirm that this URL really
# serves the GGUF file.
RUN mkdir -p /models \
    && curl --fail --location --retry 3 \
        --output /models/tinyllama-1.1b-chat.Q4_K_M.gguf \
        https://huggingface.co/Skynet-LocalAI/tinyllama-1.1b-chat.Q4_K_M.gguf

# Generate the model definition that exposes the TinyLlama file under the
# model name "gpt-oss-20b".
# IMPORTANT: the heredoc delimiter is deliberately UNQUOTED so that the shell
# expands ${CONTEXT_SIZE} and ${THREADS}. Their values are written into the
# YAML at BUILD time; overriding the variables at runtime does not rewrite
# this file.
# Heredocs in RUN require BuildKit (Dockerfile syntax 1.4 or newer).
# NOTE(review): confirm that LocalAI reads n_ctx / n_threads under
# `parameters`; its documented keys appear to be top-level `context_size`
# and `threads`.
RUN cat <<MODEL_YAML > /models/gpt-oss-20b.yaml
name: gpt-oss-20b
backend: llama
parameters:
  model: tinyllama-1.1b-chat.Q4_K_M.gguf
  n_ctx: ${CONTEXT_SIZE}
  n_threads: ${THREADS}
  temperature: 0.2
  top_p: 0.9
MODEL_YAML

# No CMD/ENTRYPOINT here: server start-up is driven by docker-compose via `command`.
up 2025-08-16 16:33:03 +00:00			`# Variante 1 (ta base actuelle)`
first 2025-08-16 14:26:36 +00:00			`FROM quay.io/go-skynet/local-ai:latest`

up 2025-08-16 16:33:03 +00:00			`# (facultatif) si l'image ne contient pas curl :`
			`# RUN apk add --no-cache curl \|\| (apt-get update && apt-get install -y curl ca-certificates)`
UP 2025-08-16 14:32:48 +00:00
first 2025-08-16 14:26:36 +00:00			`ENV MODELS_PATH=/models \`
			`DEBUG=false \`
			`THREADS=2 \`
			`CONTEXT_SIZE=1024`

			`# Crée le dossier des modèles`
			`RUN mkdir -p /models`

up 2025-08-16 16:33:03 +00:00			`# Télécharge un petit modèle chat (TinyLlama 1.1B quantisé Q4) AU BUILD`
			`# => Embarqué dans l'image, pas besoin de réseau à l'exécution pour ce fichier.`
up 2025-08-16 16:33:30 +00:00			`RUN curl -L -o /models/tinyllama-1.1b-chat.Q4_K_M.gguf \`
			`https://huggingface.co/Skynet-LocalAI/tinyllama-1.1b-chat.Q4_K_M.gguf`
up 2025-08-16 16:33:03 +00:00			`# IMPORTANT : on utilise un heredoc NON quoted (<<YAML) pour EXPANSION des variables`
			`# (n_ctx/n_threads prendront les valeurs de CONTEXT_SIZE/THREADS AU BUILD)`
			`RUN cat > /models/gpt-oss-20b.yaml <<YAML`
UP 2025-08-16 14:32:48 +00:00			`name: gpt-oss-20b`
first 2025-08-16 14:26:36 +00:00			`backend: llama`
			`parameters:`
			`model: tinyllama-1.1b-chat.Q4_K_M.gguf`
UP 2025-08-16 14:32:48 +00:00			`n_ctx: ${CONTEXT_SIZE}`
			`n_threads: ${THREADS}`
first 2025-08-16 14:26:36 +00:00			`temperature: 0.2`
			`top_p: 0.9`
UP 2025-08-16 14:32:48 +00:00			`YAML`
first 2025-08-16 14:26:36 +00:00
up 2025-08-16 16:33:03 +00:00			# Le démarrage du serveur est piloté par docker-compose via `command`