import rtx_api_3_5 as rtx_api
# Send one prompt through rtx_api and print whatever send_message returns.
prompt = "write fire emoji"
response = rtx_api.send_message(prompt)
print(response)
Chat With RTX builds int4 (W4A16 AWQ) TensorRT engines for Mistral 7B and Llama 2 13B
On my 4090
mistral 130 tok/s
llama 75 tok/s
LICENSE: CC0
import rtx_api_3_5 as rtx_api
# Send one prompt through rtx_api and print whatever send_message returns.
prompt = "write fire emoji"
response = rtx_api.send_message(prompt)
print(response)
Chat With RTX builds int4 (W4A16 AWQ) TensorRT engines for Mistral 7B and Llama 2 13B
On my 4090
mistral 130 tok/s
llama 75 tok/s
LICENSE: CC0