whispering/whispering/serve.py

#!/usr/bin/env python3

import asyncio
import json
from logging import getLogger
from typing import Final, Optional

import numpy as np
import websockets
from websockets.exceptions import ConnectionClosedOK

from whispering.schema import CURRENT_PROTOCOL_VERSION, Context
from whispering.transcriber import WhisperStreamingTranscriber

# Module-level logger, named after this module.
logger = getLogger(__name__)

# Oldest client protocol version the server accepts; contexts announcing a
# smaller value are answered with an error.  int() ignores the underscore
# separators and the leading zeros, so this evaluates to 6000.
# NOTE(review): the grouping looks like zero-padded major_minor_patch -- confirm.
MIN_PROTOCOL_VERSION: Final[int] = int("000_006_000")
# Newest client protocol version the server accepts: whatever the schema
# module declares as current.
MAX_PROTOCOL_VERSION: Final[int] = CURRENT_PROTOCOL_VERSION


async def _send_error(websocket, reason: str) -> None:
    """Send ``{"error": reason}`` to the client as a JSON text frame."""
    await websocket.send(json.dumps({"error": reason}))


async def serve_with_websocket_main(websocket):
    """Handle one websocket connection: receive a context, then audio.

    Text (``str``) frames must be JSON objects with a ``"context"`` key.  The
    value is parsed into a ``Context`` and its ``protocol_version`` is checked
    against ``MIN_PROTOCOL_VERSION`` and ``MAX_PROTOCOL_VERSION``.  Any other
    frame is treated as raw audio: it is decoded with the dtype named by
    ``ctx.data_type``, converted to ``float32`` and passed to the module-level
    transcriber ``g_wsp``; every item yielded by ``g_wsp.transcribe`` is sent
    back to the client via ``chunk.json()``.

    The handler sends an ``{"error": ...}`` message and returns when:

    * a text frame is not valid JSON, is not a JSON object, or has no
      ``"context"`` entry ("unsupported message");
    * the announced protocol version is older or newer than supported;
    * audio arrives before any context was received ("no context").

    It also stops when ``recv()`` raises ``ConnectionClosedOK``.

    Args:
        websocket: Connection object providing awaitable ``recv()`` and
            ``send()`` methods.
    """
    # Only read here; the transcriber is installed by serve_with_websocket().
    global g_wsp
    idx: int = 0  # number of audio frames processed so far (debug logging only)
    ctx: Optional[Context] = None

    while True:
        logger.debug(f"Audio #: {idx}")
        try:
            message = await websocket.recv()
        except ConnectionClosedOK:
            break

        if isinstance(message, str):
            logger.debug(f"Got str: {message}")
            # Client input is untrusted: malformed JSON or a non-object
            # payload is answered like any other unsupported message instead
            # of raising inside the handler.
            try:
                d = json.loads(message)
            except json.JSONDecodeError:
                d = None
            v = d.get("context") if isinstance(d, dict) else None
            if v is None:
                await _send_error(websocket, "unsupported message")
                return
            ctx = Context.parse_obj(v)

            if ctx.protocol_version < MIN_PROTOCOL_VERSION:
                await _send_error(
                    websocket,
                    f"protocol_version is older than {MIN_PROTOCOL_VERSION}",
                )
                # Stop here, exactly like the "newer" case below; otherwise
                # the rejected context would stay active and later audio
                # frames would still be transcribed with it.
                return
            if ctx.protocol_version > MAX_PROTOCOL_VERSION:
                await _send_error(
                    websocket,
                    f"protocol_version is newer than {MAX_PROTOCOL_VERSION}",
                )
                return

            continue

        logger.debug(f"Message size: {len(message)}")
        if ctx is None:
            await _send_error(websocket, "no context")
            return
        audio = np.frombuffer(message, dtype=np.dtype(ctx.data_type)).astype(np.float32)
        for chunk in g_wsp.transcribe(
            audio=audio,  # type: ignore
            ctx=ctx,
        ):
            await websocket.send(chunk.json())
        idx += 1


async def serve_with_websocket(
    *,
    wsp: WhisperStreamingTranscriber,
    host: str,
    port: int,
):
    """Run the websocket transcription server until it is interrupted.

    Stores ``wsp`` in the module-level ``g_wsp`` so that the per-connection
    handler ``serve_with_websocket_main`` can use it, then serves on
    ``host``:``port`` and waits on a future that nothing resolves.  A
    ``KeyboardInterrupt`` raised while serving is swallowed so the coroutine
    ends quietly.

    Args:
        wsp: Transcriber used by every connection.
        host: Interface/hostname handed to ``websockets.serve``.
        port: TCP port handed to ``websockets.serve``.
    """
    global g_wsp

    logger.info(f"Serve at {host}:{port}")
    logger.info("Make secure with your responsibility!")
    g_wsp = wsp

    try:
        server = websockets.serve(  # type: ignore
            serve_with_websocket_main,
            host=host,
            port=port,
            # Size limit passed through to websockets for incoming messages.
            max_size=999999999,
        )
        async with server:
            # Nobody ever sets a result on this future, so awaiting it parks
            # the coroutine while the server keeps accepting connections.
            never_done = asyncio.Future()
            await never_done
    except KeyboardInterrupt:
        pass
Add websocket server 2022-09-24 11:45:20 +00:00			`#!/usr/bin/env python3`

			`import asyncio`
Removed ctx from server 2022-10-02 12:59:02 +00:00			`import json`
Add websocket server 2022-09-24 11:45:20 +00:00			`from logging import getLogger`
Add protocol_version 2022-10-15 04:23:00 +00:00			`from typing import Final, Optional`
Add websocket server 2022-09-24 11:45:20 +00:00
			`import numpy as np`
			`import websockets`
Use different context for each connection 2022-10-01 14:55:12 +00:00			`from websockets.exceptions import ConnectionClosedOK`
Add websocket server 2022-09-24 11:45:20 +00:00
Updated protocol version 2022-10-17 13:09:23 +00:00			`from whispering.schema import CURRENT_PROTOCOL_VERSION, Context`
Fix None access bug 2022-10-17 12:46:15 +00:00			`from whispering.transcriber import WhisperStreamingTranscriber`
Add websocket server 2022-09-24 11:45:20 +00:00
			`logger = getLogger(__name__)`

Add protocol_version 2022-10-15 04:23:00 +00:00			`MIN_PROTOCOL_VERSION: Final[int] = int("000_006_000")`
Updated protocol version 2022-10-17 13:09:23 +00:00			`MAX_PROTOCOL_VERSION: Final[int] = CURRENT_PROTOCOL_VERSION`
Add protocol_version 2022-10-15 04:23:00 +00:00
Add websocket server 2022-09-24 11:45:20 +00:00
			`async def serve_with_websocket_main(websocket):`
			`global g_wsp`
			`idx: int = 0`
Removed ctx from server 2022-10-02 12:59:02 +00:00			`ctx: Optional[Context] = None`
Add websocket server 2022-09-24 11:45:20 +00:00
			`while True:`
Fix 2022-10-02 10:48:41 +00:00			`logger.debug(f"Audio #: {idx}")`
Use different context for each connection 2022-10-01 14:55:12 +00:00			`try:`
			`message = await websocket.recv()`
			`except ConnectionClosedOK:`
			`break`
Add websocket server 2022-09-24 11:45:20 +00:00
			`if isinstance(message, str):`
			`logger.debug(f"Got str: {message}")`
Send context 2022-10-02 13:02:17 +00:00			`d = json.loads(message)`
			`v = d.get("context")`
			`if v is not None:`
			`ctx = Context.parse_obj(v)`
			`else:`
			`await websocket.send(`
			`json.dumps(`
			`{`
			`"error": "unsupported message",`
			`}`
			`)`
			`)`
			`return`
Add protocol_version 2022-10-15 04:23:00 +00:00
			`if ctx.protocol_version < MIN_PROTOCOL_VERSION:`
			`await websocket.send(`
			`json.dumps(`
			`{`
			`"error": f"protocol_version is older than {MIN_PROTOCOL_VERSION}"`
			`}`
			`)`
			`)`
			`elif ctx.protocol_version > MAX_PROTOCOL_VERSION:`
			`await websocket.send(`
			`json.dumps(`
			`{`
			`"error": f"protocol_version is newer than {MAX_PROTOCOL_VERSION}"`
			`}`
			`)`
			`)`
			`return`

Add websocket server 2022-09-24 11:45:20 +00:00			`continue`

			`logger.debug(f"Message size: {len(message)}")`
Removed ctx from server 2022-10-02 12:59:02 +00:00			`if ctx is None:`
			`await websocket.send(`
			`json.dumps(`
			`{`
			`"error": "no context",`
			`}`
			`)`
			`)`
			`return`
Fix None access bug 2022-10-17 12:46:15 +00:00			`audio = np.frombuffer(message, dtype=np.dtype(ctx.data_type)).astype(np.float32)`
Fix (openai/whisper@7cb4cc2) 2022-10-01 14:20:46 +00:00			`for chunk in g_wsp.transcribe(`
Fix 2022-10-02 10:48:41 +00:00			`audio=audio, # type: ignore`
Use different context for each connection 2022-10-01 14:55:12 +00:00			`ctx=ctx,`
Fix (openai/whisper@7cb4cc2) 2022-10-01 14:20:46 +00:00			`):`
Changed protocol 2022-09-24 12:39:30 +00:00			`await websocket.send(chunk.json())`
Add websocket server 2022-09-24 11:45:20 +00:00			`idx += 1`


			`async def serve_with_websocket(`
			`*,`
			`wsp: WhisperStreamingTranscriber,`
			`host: str,`
			`port: int,`
			`):`
			`logger.info(f"Serve at {host}:{port}")`
			`logger.info("Make secure with your responsibility!")`
			`global g_wsp`
			`g_wsp = wsp`

			`try:`
			`async with websockets.serve( # type: ignore`
			`serve_with_websocket_main,`
			`host=host,`
			`port=port,`
			`max_size=999999999,`
			`):`
			`await asyncio.Future()`
			`except KeyboardInterrupt:`
			`pass`