https://www.anyscale.com/blog/a-comprehensive-guide-for-building-rag-based-llm-applications-part-1
https://www.anyscale.com/blog/turbocharge-langchain-now-guide-to-20x-faster-embedding
aws ecr get-login-password --region us-east-1 | docker login --username AWS --password-stdin 665577950062.dkr.ecr.us-east-1.amazonaws.com
docker build -t ray-example:latest .
docker tag ray-example:latest 665577950062.dkr.ecr.us-east-1.amazonaws.com/ray-example:latest
docker push 665577950062.dkr.ecr.us-east-1.amazonaws.com/ray-example:latest
docker compose up -d
docker build -t ray-example . && docker compose up -d
docker build -t localbuild:ray-example .
docker build --no-cache -t ray-example .
docker system prune -f
RUN pip install ctransformers[cuda]
echo "AWS_ACCESS_KEY_ID=$AWS_ACCESS_KEY_ID" >> /home/ubuntu/AWS_info.txt
curl http://localhost:8000/ray-example/ -X POST -H "Content-Type: application/json" -v -d '{"en_text": "Towards Certification of Machine Learning-Based Distributed Systems Behavior"}'
curl http://localhost:8000/translate/en/fr/ -X POST -H "Content-Type: application/json" -v -d '{"en_text": "Towards Certification of Machine Learning-Based Distributed Systems Behavior"}'
pip install git+https://github.com/huggingface/transformers