# Blog post available at: https://dev.premai.io/blog/llm-fastapi-docker
# Build the image from ./Dockerfile (build context: current directory) and,
# only if the build succeeds, start a container from the freshly built
# ":latest" tag.
#
# - MODEL_ID is handed to the Dockerfile as a build argument; how it is used
#   is defined in the Dockerfile (presumably the model baked into the image;
#   verify there).
# - The image is tagged both ":latest" and ":0.0.1".
# - The container is started with access to all GPUs and with container port
#   8000 published on host port 8000.
#
# The two commands are joined with "&&" so a failed build never falls through
# to running a stale or missing image, and the build's exit status is kept.

# Single source of truth for the image repository so the build tags and the
# run target cannot drift apart.
image="blog-post/chat-falcon-7b-instruct-gpu"

docker build --file ./Dockerfile \
  --build-arg="MODEL_ID=tiiuae/falcon-7b-instruct" \
  --tag "${image}:latest" \
  --tag "${image}:0.0.1" \
  . &&
  docker run --gpus all -p 8000:8000 "${image}:latest"