File size: 3,701 Bytes
825f021
 
2f48b4a
 
825f021
7fb7065
825f021
 
 
 
 
 
 
65f1d1f
 
825f021
 
 
 
 
 
 
2f48b4a
 
 
 
 
 
0756b41
65f1d1f
 
0756b41
 
 
 
 
65f1d1f
 
825f021
65f1d1f
825f021
65f1d1f
825f021
 
 
 
 
 
 
 
65f1d1f
 
 
 
 
 
 
 
 
825f021
 
 
 
 
 
 
 
 
 
 
 
 
 
b177c43
 
825f021
 
 
 
2f48b4a
825f021
 
 
 
 
 
 
 
 
 
 
 
 
 
2f48b4a
825f021
 
 
 
 
 
 
 
 
 
2f48b4a
825f021
 
 
 
 
2f48b4a
825f021
 
65f1d1f
825f021
65f1d1f
 
825f021
 
65f1d1f
b177c43
65f1d1f
 
825f021
65f1d1f
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
#!/bin/bash

set -e  # Exit on error

# Default values
CONFIG_FILE="main/resources/local_config.yaml"
ENV_FILE=".env"
CONTAINER_NAME="llm-inference-server"
BUILD_ONLY=false
PLATFORM=""

# Function to display usage
usage() {
    echo "Usage: $0 [-c <config_file>] [-e <env_file>] [-n <container_name>] [-b] [-h]"
    echo "  -c : Config file path (default: resources/local_config.yaml)"
    echo "  -e : Environment file path (default: .env)"
    echo "  -n : Container name (default: llm-inference-server)"
    echo "  -b : Build only (don't run container)"
    echo "  -h : Display this help message"
    exit 1
}

# Function to handle errors
handle_error() {
    echo "Error: $1"
    exit 1
}

# Function to read yaml using grep and sed
parse_yaml() {
    local file=$1
    # Get port - look for port under server section and extract the number
    PORT=$(grep -A5 "^server:" "$file" | grep "port:" | sed 's/[^0-9]*//g')
    # Get host - look for host under server section and extract the value in quotes
    HOST=$(grep -A5 "^server:" "$file" | grep "host:" | sed 's/.*"//;s/".*//')
    echo "$PORT $HOST"
}

# Parse command line arguments
while getopts "c:e:n:bh" opt; do
    case $opt in
        c) CONFIG_FILE=$OPTARG ;;
        e) ENV_FILE=$OPTARG ;;
        n) CONTAINER_NAME=$OPTARG ;;
        b) BUILD_ONLY=true ;;
        h) usage ;;
        ?) usage ;;
    esac
done

# Check if config file exists
if [ ! -f "$CONFIG_FILE" ]; then
    handle_error "Config file not found: $CONFIG_FILE"
fi

# Read port and host from config
read PORT HOST < <(parse_yaml "$CONFIG_FILE")
echo "Using configuration - Port: $PORT, Host: $HOST"

# Detect platform and set appropriate options
if [[ "$(uname -s)" == "Darwin" ]]; then
    echo "Detected MacOS platform"
    PLATFORM="linux/arm64"
    if [[ "$(uname -m)" == "x86_64" ]]; then
        PLATFORM="linux/amd64"
    fi
    PLATFORM_ARG="--platform=${PLATFORM}"
else
    echo "Detected Linux platform"
    # Check if podman is available (common in RHEL environments)
    if command -v podman &> /dev/null; then
        echo "Podman detected, using podman instead of docker"
        function docker { podman "${@}"; }
    fi
    PLATFORM_ARG=""
fi

# Check if docker is installed
if ! command -v docker &> /dev/null; then
    handle_error "Docker is not installed"
fi

# Check if .env file exists
if [ ! -f "$ENV_FILE" ]; then
    echo "Warning: $ENV_FILE file not found"
    echo "Creating sample $ENV_FILE file..."
    cat > "$ENV_FILE" << EOL
InfAPITokenWrite=your_huggingface_token_here
EOL
    echo "Please edit $ENV_FILE with your actual configuration"
fi

# Build the Docker image
echo "Building Docker image..."
docker build $PLATFORM_ARG -t $CONTAINER_NAME . || handle_error "Failed to build Docker image"

# Exit if build only
if [ "$BUILD_ONLY" = true ]; then
    echo "Build completed. Exiting as requested."
    exit 0
fi

# Check if container is already running
if docker ps -q -f name=$CONTAINER_NAME | grep -q .; then
    echo "Stopping existing container..."
    docker stop $CONTAINER_NAME || handle_error "Failed to stop existing container"
fi

# Remove existing container
if docker ps -aq -f name=$CONTAINER_NAME | grep -q .; then
    echo "Removing existing container..."
    docker rm $CONTAINER_NAME || handle_error "Failed to remove existing container"
fi

# Run the container in interactive mode
echo "Starting container on port $PORT..."
echo "Press Ctrl+C to stop the server"
docker run --rm -it \
    --name $CONTAINER_NAME \
    --env-file $ENV_FILE \
    -p $PORT:$PORT \
    -v $HOME/.cache/huggingface:/app/.cache/huggingface \
    -v "$(pwd)/$CONFIG_FILE:/app/$CONFIG_FILE" \
    $CONTAINER_NAME

echo "Container stopped"