Files
Open-Assistant/inference/text-client/__main__.py
T
Yannic Kilcher 90c3d5640e Added database to inference server (#1446)
* added db for inference

* fixed dockerfiles for inference
2023-02-10 22:51:35 +01:00

51 lines
1.5 KiB
Python

"""Simple REPL frontend."""
import json
import time
import requests
import sseclient
import typer
app = typer.Typer()
@app.command()
def main(backend_url: str = "http://127.0.0.1:8000"):
"""Simple REPL client."""
while True:
try:
chat_id = requests.post(f"{backend_url}/chat", json={}).json()["id"]
typer.echo(f"Chat ID: {chat_id}")
while True:
message = typer.prompt("User").strip()
# wait for stream to be ready
# could implement a queue position indicator
# could be implemented with long polling
# but server load needs to be considered
response = requests.post(
f"{backend_url}/chat/{chat_id}/message",
json={"message": message},
stream=True,
headers={"Accept": "text/event-stream"},
)
response.raise_for_status()
client = sseclient.SSEClient(response)
print("Assistant: ", end="", flush=True)
for event in client.events():
data = json.loads(event.data)
print(data["token"]["text"], end="", flush=True)
print()
except typer.Abort:
typer.echo("Exiting...")
break
except Exception:
typer.echo("Error, restarting chat...")
time.sleep(1)
if __name__ == "__main__":
app()