File size: 922 Bytes
5005caf
 
 
 
 
 
 
 
 
 
 
cc4cd30
 
 
 
 
 
5b6ee0c
 
cc4cd30
 
 
5b6ee0c
6ee281b
cc4cd30
 
 
 
5005caf
 
 
 
 
 
cc4cd30
5005caf
 
 
 
2763fd7
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
version: "3.8"

services:
  # Single-service stack: the ML backend container.
  ml-backend:
    container_name: ml-backend
    image: humansignal/ml-backend:v0
    # Built from the directory holding this compose file; TEST_ENV is
    # forwarded as a build argument from the invoking shell / .env file.
    build:
      context: .
      args:
        TEST_ENV: ${TEST_ENV}
    # Host port 9090 -> container port 9090.
    ports:
      - "9090:9090"
    # Host ./data/server is bind-mounted at /data, the parent of the
    # MODEL_DIR and HF_CHECKPOINT_DIR paths configured below.
    volumes:
      - "./data/server:/data"
    # All values are quoted so they reach the container as the exact
    # strings written here (no YAML number/float re-typing).
    environment:
      # --- Model ---
      MODEL_NAME: "google/flan-t5-base"
      MAX_LENGTH: "512"
      GENERATION_MAX_LENGTH: "128"
      NUM_RETURN_SEQUENCES: "1"
      # --- LoRA ---
      LORA_R: "16"
      LORA_ALPHA: "16"
      LORA_DROPOUT: "0.1"
      LORA_TARGET_MODULES: "q,v"
      # --- Training ---
      NUM_EPOCHS: "16"
      LEARNING_RATE: "1e-5"
      BATCH_SIZE: "1"
      MAX_STEPS: "100"
      SAVE_STEPS: "50"
      # --- Server / misc ---
      # Both credentials are set to the empty string (not inherited from
      # the host); presumably this leaves basic auth off - TODO confirm.
      BASIC_AUTH_USER: ""
      BASIC_AUTH_PASS: ""
      LOG_LEVEL: "DEBUG"
      WORKERS: "1"
      THREADS: "8"
      MODEL_DIR: "/data/models"
      HF_CHECKPOINT_DIR: "/data/checkpoints"
# TODO: verify whether this file is still needed