Merge pull request #18 from codeforequity-at/BOT-2087-rasa-channel

Botium · web-flow · commit 08fea72f9047 · 2021-01-26T12:02:02.000+01:00
BOT-2087-rasa-channel
diff --git a/.gitignore b/.gitignore
@@ -1,2 +1,3 @@
 logs
-docker-compose.override.yml
+docker-compose.override.yml
+__pycache__
diff --git a/README.md b/README.md
@@ -24,6 +24,7 @@ Some examples what you can do with this:
 
 * Synthesize audio tracks for Youtube tutorials
 * Build voice-enabled chatbot services (for example, IVR systems)
+  * see the [Rasa Custom Voice Channel](./connectors/rasa)
 * Classification of audio file transcriptions
 * [Automated Testing](https://chatbotslife.com/testing-alexa-skills-with-avs-mocha-and-botium-f6c22549f66e) of Voice services with [Botium](https://medium.com/@floriantreml/botium-in-a-nutshell-part-1-overview-f8d0ceaf8fb4)
 
@@ -154,6 +155,11 @@ This project is standing on the shoulders of giants.
 
 ## Changelog
 
+### 2021-01-26
+
+* Added several profiles for adding noise or other audio artifacts to your files
+* Added custom channel for usage with Rasa
+
 ### 2020-12-18
 
 * Adding support for Google Text-To-Speech
diff --git a/connectors/rasa/Makefile b/connectors/rasa/Makefile
@@ -0,0 +1,4 @@
+# Rasa project to launch. Assigned with ?= so it can be overridden from the
+# environment or the command line, e.g. `make rasa_run RASADIR=/path/to/bot`.
+RASADIR ?= /home/ftreml/dev/rasa/examples/concertbot
+
+# rasa_run does not produce a file of that name.
+.PHONY: rasa_run
+
+# Run Rasa inside RASADIR with this directory on PYTHONPATH, using the
+# credentials.yml that lives next to this Makefile.
+rasa_run:
+		cd $(RASADIR) && PYTHONPATH=$(PWD) rasa run -vv --cors "*" --credentials $(PWD)/credentials.yml
diff --git a/connectors/rasa/Readme.md b/connectors/rasa/Readme.md
@@ -0,0 +1,52 @@
+# Rasa Custom Voice Channel
+
+This channel is an extension of the Socket.io-Channel and will
+
+* accept input as audio and convert it to text before handing it down the Rasa pipeline
+* convert text responses received from the Rasa pipeline to audio and attach the audio to the response
+
+## Installation
+
+Clone or download this repository.
+
+    > git clone https://github.com/codeforequity-at/botium-speech-processing.git
+
+Make this directory available for Python imports by adding it to the PYTHONPATH environment variable.
+
+    > export PYTHONPATH=$PYTHONPATH:<clone-dir>/connectors/rasa
+
+Use the _credentials.yml_ file when launching Rasa.
+
+    > rasa run --credentials <clone-dir>/connectors/rasa/credentials.yml
+
+Or when using it with docker-compose, first copy the _connectors_ folder to your Rasa installation, and you can use a _docker-compose.yml_ file like this one:
+
+```
+version: '3.0'
+services:
+  rasa:
+    image: rasa/rasa:latest-full
+    ports:
+      - 5005:5005
+    volumes:
+      - ./:/app
+    environment:
+      PYTHONPATH: "/app/connectors/rasa:/app"
+      RASA_DUCKLING_HTTP_URL: http://rasa-duckling:8000
+    command: run -vv --cors "*" --credentials /app/connectors/rasa/credentials.yml --enable-api --model models/dialogue --endpoints endpoints.yml -t B0tium1234
+  rasa-actions:
+    build:
+      context: .
+    ports:
+      - 5055:5055
+  rasa-duckling:
+    image: rasa/duckling
+    ports:
+      - 8000:8000
+```
+
+## Testing
+
+There is a simple test client based on the [Rasa Voice Interface](https://github.com/RasaHQ/rasa-voice-interface) available.
+
+In the _client_ directory, change the Rasa endpoint in the _docker-compose.yml_ file, then launch the client and open the web interface to chat with your Rasa chatbot.
diff --git a/connectors/rasa/botium/SocketIOVoiceInput.py b/connectors/rasa/botium/SocketIOVoiceInput.py
@@ -0,0 +1,280 @@
+import logging
+import uuid
+import base64
+from typing import Any, Awaitable, Callable, Dict, Iterable, List, Optional, Text
+
+from rasa.core.channels.channel import InputChannel, OutputChannel, UserMessage
+import rasa.shared.utils.io
+from sanic import Blueprint, response
+from sanic.request import Request
+from sanic.response import HTTPResponse
+from socketio import AsyncServer
+
+from urllib.request import urlopen, Request
+from urllib.parse import urlencode
+import json
+
+logger = logging.getLogger(__name__)  # module-level logger used by the channel classes in this file
+
+print('Hello from SocketVoice')  # NOTE(review): writes to stdout on every import - looks like a debug leftover, confirm it can go
+
+class SocketVoiceBlueprint(Blueprint):
+    """Sanic blueprint that attaches a socket.io server when it is registered."""
+
+    def __init__(self, sio: AsyncServer, socketio_path, *args, **kwargs):
+        """Store the socket.io server and its mount path, then build the blueprint.
+
+        All remaining positional and keyword arguments are forwarded unchanged
+        to ``Blueprint.__init__``.
+        """
+        self.socketio_path = socketio_path
+        self.sio = sio
+        super().__init__(*args, **kwargs)
+
+    def register(self, app, options) -> None:
+        """Attach the socket.io server to ``app``, then register as usual."""
+        server, mount_path = self.sio, self.socketio_path
+        server.attach(app, mount_path)
+        super().register(app, options)
+
+
+class SocketIOVoiceOutput(OutputChannel):
+    """Socket.io output channel that adds synthesized speech to text messages.
+
+    Every outgoing payload with a non-empty ``text`` entry is sent to the
+    speech service at ``<botium_speech_url>/api/tts/<botium_speech_language>``.
+    The returned audio is stored in the payload under ``link`` as a base64
+    ``data:audio/wav`` URI before the payload is emitted on the socket.
+
+    NOTE(review): ``botium_speech_apikey`` is stored but not sent with any
+    request made by this class - confirm whether the speech service needs it.
+    """
+
+    @classmethod
+    def name(cls) -> Text:
+        """Return the name of this channel."""
+        return "socketiovoice"
+
+    def __init__(self, sio: AsyncServer, bot_message_evt: Text, botium_speech_url: Text, botium_speech_apikey: Text, botium_speech_language: Text, botium_speech_voice: Text) -> None:
+        """Store the socket.io server, the bot event name and the speech settings."""
+        self.sio = sio
+        self.bot_message_evt = bot_message_evt
+        self.botium_speech_url = botium_speech_url
+        self.botium_speech_apikey = botium_speech_apikey
+        self.botium_speech_language = botium_speech_language
+        self.botium_speech_voice = botium_speech_voice
+
+    def _synthesize(self, text: Text) -> bytes:
+        """Fetch the audio for ``text`` from the speech service (blocking call)."""
+        query = {"text": text}
+        if self.botium_speech_voice:
+            query["voice"] = self.botium_speech_voice
+
+        audio_endpoint = (
+            f"{self.botium_speech_url}/api/tts/"
+            f"{self.botium_speech_language}?{urlencode(query)}"
+        )
+        # Log before the request so a failing call is still traceable.
+        logger.debug(f"_send_message- Calling Speech Endpoint: {audio_endpoint}")
+        # The context manager closes the HTTP response once the body is read.
+        with urlopen(audio_endpoint) as speech_response:
+            return speech_response.read()
+
+    async def _send_message(self, socket_id: Text, response: Any) -> None:
+        """Sends a message to the recipient using the bot event.
+
+        If ``response`` carries a non-empty ``text``, the synthesized audio is
+        added to ``response`` in place under the ``link`` key before emitting.
+        """
+        import asyncio
+
+        if response.get("text"):
+            # urlopen blocks; run it on the default executor so the event loop
+            # keeps serving other connections while the audio is generated.
+            loop = asyncio.get_event_loop()
+            audio = await loop.run_in_executor(
+                None, self._synthesize, response["text"]
+            )
+            audio_base64 = base64.b64encode(audio).decode("ascii")
+            response["link"] = "data:audio/wav;base64," + audio_base64
+
+        await self.sio.emit(self.bot_message_evt, response, room=socket_id)
+
+    async def send_text_message(
+        self, recipient_id: Text, text: Text, **kwargs: Any
+    ) -> None:
+        """Send a message through this channel."""
+
+        # One socket message per paragraph (blank-line separated fragment).
+        for message_part in text.strip().split("\n\n"):
+            await self._send_message(recipient_id, {"text": message_part})
+
+    async def send_image_url(
+        self, recipient_id: Text, image: Text, **kwargs: Any
+    ) -> None:
+        """Sends an image to the output"""
+
+        message = {"attachment": {"type": "image", "payload": {"src": image}}}
+        await self._send_message(recipient_id, message)
+
+    async def send_text_with_buttons(
+        self,
+        recipient_id: Text,
+        text: Text,
+        buttons: List[Dict[Text, Any]],
+        **kwargs: Any,
+    ) -> None:
+        """Sends buttons to the output."""
+
+        # Split text and create a message for each text fragment. str.split
+        # with a separator always yields at least one element, so there is
+        # always a last message to attach the quick replies to.
+        message_parts = text.strip().split("\n\n")
+        messages = [{"text": message, "quick_replies": []} for message in message_parts]
+
+        # attach all buttons to the last text fragment
+        for button in buttons:
+            messages[-1]["quick_replies"].append(
+                {
+                    "content_type": "text",
+                    "title": button["title"],
+                    "payload": button["payload"],
+                }
+            )
+
+        for message in messages:
+            await self._send_message(recipient_id, message)
+
+    async def send_elements(
+        self, recipient_id: Text, elements: Iterable[Dict[Text, Any]], **kwargs: Any
+    ) -> None:
+        """Sends elements to the output."""
+
+        for element in elements:
+            message = {
+                "attachment": {
+                    "type": "template",
+                    "payload": {"template_type": "generic", "elements": element},
+                }
+            }
+
+            await self._send_message(recipient_id, message)
+
+    async def send_custom_json(
+        self, recipient_id: Text, json_message: Dict[Text, Any], **kwargs: Any
+    ) -> None:
+        """Sends custom json to the output"""
+
+        # The entries of json_message are passed to emit() as keyword
+        # arguments; the recipient becomes the room unless one is already set.
+        json_message.setdefault("room", recipient_id)
+
+        await self.sio.emit(self.bot_message_evt, **json_message)
+
+    async def send_attachment(
+        self, recipient_id: Text, attachment: Dict[Text, Any], **kwargs: Any
+    ) -> None:
+        """Sends an attachment to the user."""
+        await self._send_message(recipient_id, {"attachment": attachment})
+
+
+class SocketIOVoiceInput(InputChannel):
+    """A socket.io input channel that also accepts spoken user messages.
+
+    A user message whose ``message`` field starts with ``data:`` is treated as
+    a base64 data URI holding audio. The audio is posted to the speech service
+    (``/api/convert/WAVTOMONOWAV``, then ``/api/stt/<language>``) and the
+    recognized text is passed on to Rasa. Any other string is forwarded as
+    plain text.
+    """
+
+    @classmethod
+    def name(cls) -> Text:
+        """Return the name of this channel."""
+        return "socketiovoice"
+
+    @classmethod
+    def from_credentials(cls, credentials: Optional[Dict[Text, Any]]) -> InputChannel:
+        """Build the channel from its credentials entry, applying defaults."""
+        credentials = credentials or {}
+        return cls(
+            credentials.get("user_message_evt", "user_uttered"),
+            credentials.get("bot_message_evt", "bot_uttered"),
+            credentials.get("namespace"),
+            credentials.get("session_persistence", False),
+            credentials.get("socketio_path", "/socket.io"),
+            credentials.get("botium_speech_url"),
+            credentials.get("botium_speech_apikey"),
+            credentials.get("botium_speech_language", "en"),
+            credentials.get("botium_speech_voice"),
+        )
+
+    def __init__(
+        self,
+        user_message_evt: Text = "user_uttered",
+        bot_message_evt: Text = "bot_uttered",
+        namespace: Optional[Text] = None,
+        session_persistence: bool = False,
+        socketio_path: Optional[Text] = "/socket.io",
+        botium_speech_url: Optional[Text] = None,
+        botium_speech_apikey: Optional[Text] = None,
+        botium_speech_language: Text = "en",
+        botium_speech_voice: Optional[Text] = None,
+    ):
+        """Store the socket.io event names and the speech service settings.
+
+        ``botium_speech_voice`` is only used when truthy; ``None`` (the
+        default) leaves the voice choice to the speech service.
+        """
+        self.bot_message_evt = bot_message_evt
+        self.session_persistence = session_persistence
+        self.user_message_evt = user_message_evt
+        self.namespace = namespace
+        self.socketio_path = socketio_path
+        self.botium_speech_url = botium_speech_url
+        self.botium_speech_apikey = botium_speech_apikey
+        self.botium_speech_language = botium_speech_language
+        self.botium_speech_voice = botium_speech_voice
+        # Set by blueprint(); stays None until the blueprint has been created.
+        self.sio = None
+
+    def _new_output_channel(self, sio: AsyncServer) -> "SocketIOVoiceOutput":
+        """Create an output channel bound to ``sio`` with this channel's settings."""
+        return SocketIOVoiceOutput(
+            sio,
+            self.bot_message_evt,
+            self.botium_speech_url,
+            self.botium_speech_apikey,
+            self.botium_speech_language,
+            self.botium_speech_voice,
+        )
+
+    @staticmethod
+    def _post_wav(url: Text, payload: bytes) -> bytes:
+        """POST ``payload`` as ``audio/wav`` to ``url`` and return the body (blocking)."""
+        # Imported under an alias because the module-level name ``Request`` is
+        # bound by both the sanic and the urllib import.
+        from urllib.request import Request as UrlRequest
+
+        request = UrlRequest(
+            url=url,
+            data=payload,
+            method="POST",
+            headers={"content-type": "audio/wav"},
+        )
+        # The context manager closes the HTTP response once the body is read.
+        with urlopen(request) as res:
+            return res.read()
+
+    def _transcribe(self, audio_data: bytes) -> Text:
+        """Convert ``audio_data`` via the speech service and return the recognized text (blocking)."""
+        convert_endpoint = f"{self.botium_speech_url}/api/convert/WAVTOMONOWAV"
+        logger.debug(f"handle_message - Calling Convert Endpoint: {convert_endpoint}")
+        audio_data_wav = self._post_wav(convert_endpoint, audio_data)
+
+        audio_endpoint = f"{self.botium_speech_url}/api/stt/{self.botium_speech_language}"
+        logger.debug(f"handle_message - Calling Speech Endpoint: {audio_endpoint}")
+        res_json = json.loads(self._post_wav(audio_endpoint, audio_data_wav).decode("utf-8"))
+        logger.debug(f"handle_message - Calling Speech Endpoint: {audio_endpoint} => {res_json}")
+        return res_json["text"]
+
+    def get_output_channel(self) -> Optional["OutputChannel"]:
+        """Return an output channel, or ``None`` (with a warning) before blueprint() ran."""
+        if self.sio is None:
+            rasa.shared.utils.io.raise_warning(
+                "SocketIO output channel cannot be recreated. "
+                "This is expected behavior when using multiple Sanic "
+                "workers or multiple Rasa Open Source instances. "
+                "Please use a different channel for external events in these "
+                "scenarios."
+            )
+            return None
+        return self._new_output_channel(self.sio)
+
+    def blueprint(
+        self, on_new_message: Callable[[UserMessage], Awaitable[Any]]
+    ) -> Blueprint:
+        """Create the socket.io server, register its event handlers and return the blueprint.
+
+        ``on_new_message`` is awaited with a ``UserMessage`` for every accepted
+        user message.
+        """
+        import asyncio
+
+        # Workaround so that socketio works with requests from other origins.
+        # https://github.com/miguelgrinberg/python-socketio/issues/205#issuecomment-493769183
+        sio = AsyncServer(async_mode="sanic", cors_allowed_origins=[])
+        socketio_webhook = SocketVoiceBlueprint(
+            sio, self.socketio_path, "socketio_webhook", __name__
+        )
+
+        # make sio object static to use in get_output_channel
+        self.sio = sio
+
+        @socketio_webhook.route("/", methods=["GET"])
+        async def health(_: Request) -> HTTPResponse:
+            return response.json({"status": "ok"})
+
+        @sio.on("connect", namespace=self.namespace)
+        async def connect(sid: Text, _) -> None:
+            logger.debug(f"User {sid} connected to socketIO endpoint.")
+
+        @sio.on("disconnect", namespace=self.namespace)
+        async def disconnect(sid: Text) -> None:
+            logger.debug(f"User {sid} disconnected from socketIO endpoint.")
+
+        @sio.on("session_request", namespace=self.namespace)
+        async def session_request(sid: Text, data: Optional[Dict]):
+            if data is None:
+                data = {}
+            # Generate a session id when the client did not supply one.
+            if "session_id" not in data or data["session_id"] is None:
+                data["session_id"] = uuid.uuid4().hex
+            if self.session_persistence:
+                sio.enter_room(sid, data["session_id"])
+            await sio.emit("session_confirm", data["session_id"], room=sid)
+            logger.debug(f"User {sid} connected to socketIO endpoint.")
+
+        @sio.on(self.user_message_evt, namespace=self.namespace)
+        async def handle_message(sid: Text, data: Dict) -> Any:
+            output_channel = self._new_output_channel(sio)
+
+            if self.session_persistence:
+                if not data.get("session_id"):
+                    rasa.shared.utils.io.raise_warning(
+                        "A message without a valid session_id "
+                        "was received. This message will be "
+                        "ignored. Make sure to set a proper "
+                        "session id using the "
+                        "`session_request` socketIO event."
+                    )
+                    return
+                sender_id = data["session_id"]
+            else:
+                sender_id = sid
+
+            # The payload comes from the client: ignore events that carry no
+            # string message instead of failing inside the handler.
+            raw_message = data.get("message")
+            if not isinstance(raw_message, str):
+                rasa.shared.utils.io.raise_warning(
+                    "A message without a text or audio `message` "
+                    "payload was received. This message will be ignored."
+                )
+                return
+
+            if raw_message.startswith("data:"):
+                # Data URI: everything after the first comma is the base64 payload.
+                _header, encoded = raw_message.split(",", 1)
+                audio_data = base64.b64decode(encoded.encode("ascii"))
+
+                # The speech service calls block; run them on the default
+                # executor so the event loop keeps serving other connections.
+                loop = asyncio.get_event_loop()
+                message = await loop.run_in_executor(
+                    None, self._transcribe, audio_data
+                )
+
+                # Send the recognized text back to the sender.
+                await sio.emit(self.user_message_evt, {"text": message}, room=sid)
+            else:
+                message = raw_message
+
+            user_message = UserMessage(
+                message, output_channel, sender_id, input_channel=self.name()
+            )
+            await on_new_message(user_message)
+
+        return socketio_webhook
diff --git a/connectors/rasa/botium/__init__.py b/connectors/rasa/botium/__init__.py
@@ -0,0 +1 @@
+from .SocketIOVoiceInput import SocketIOVoiceInput
diff --git a/connectors/rasa/client/Dockerfile b/connectors/rasa/client/Dockerfile
@@ -0,0 +1,19 @@
+# Test client image: downloads the Rasa Voice Interface, builds it and serves the result.
+FROM node:lts-alpine
+# Build-time settings that are patched into the client sources further down.
+ARG RASA_ENDPOINT=http://localhost:5005
+ARG RASA_PATH=/socket.io
+ARG PUBLIC_PATH=/
+
+# Packages are grouped under the virtual name .build-deps so they can be removed again later.
+RUN apk add --no-cache --virtual .build-deps curl sed python make g++
+
+WORKDIR /app/
+# Fetch and unpack the master branch archive of rasa-voice-interface.
+RUN curl -L -o rvi.zip "https://github.com/RasaHQ/rasa-voice-interface/archive/master.zip" && unzip rvi.zip && rm rvi.zip
+WORKDIR /app/rasa-voice-interface-master
+# Hand the sources to the node user, rewrite the endpoint in src/main.js and the
+# publicPath in vue.config.js from the build args, then install and build.
+RUN chown -R node /app/rasa-voice-interface-master \
+  && sed -i "s|'http://localhost:5005'|'${RASA_ENDPOINT}', options: { path: '${RASA_PATH}' }|g" src/main.js \
+  && sed -i "s|integrity: false|integrity: false, publicPath: '${PUBLIC_PATH}'|g" vue.config.js \
+  && npm install --no-optional && npm install serve && npm run-script build
+# NOTE(review): the packages are removed in a separate RUN, i.e. a separate layer
+# from the one that installed them - presumably this does not shrink the image; confirm.
+RUN apk del .build-deps
+
+EXPOSE 8080
+USER node
+# Serve the dist directory on port 8080.
+CMD PORT=8080 npx serve -s dist
diff --git a/connectors/rasa/client/docker-compose.yml b/connectors/rasa/client/docker-compose.yml
diff --git a/connectors/rasa/credentials.yml b/connectors/rasa/credentials.yml
diff --git a/frontend/resources/.env b/frontend/resources/.env

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+from .SocketIOVoiceInput import SocketIOVoiceInput`