ASR + LLaMA + TTS
- CMAKE_ARGS="-DLLAMA_CUBLAS=on" pip install llama-cpp-python
- pip install -r requirements.txt
- .txt
Chainlit GitHub: https://github.com/Chainlit/chainlit
Chainlit docs: https://docs.chainlit.io/get-started/overview
./talk-llama -mw ./models/ggml-base.en.bin -ml ../llama.cpp/models/7B/zephyr-7b-beta-pl.Q8_0.gguf -p "Georgi" -t 8
openssl req -newkey rsa:2048 -nodes -keyout rsa_private.key -x509 -days 799 -out cert.crt
zephyr-7b-beta is fine-tuned from Mistral-7B-v0.1 (4096)