Talk2Care-Backend/client.py at main · jrcz-data-science-lab/Talk2Care-Backend · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
import sounddevice as sd
import numpy as np
from scipy.io.wavfile import write, read
import base64
import tempfile
import requests
import time
import sys
import threading
import os

# Endpoint that receives every JSON request this client posts.
SERVER_URL = "http://145.19.54.110:8000/general"
# Sample rate (Hz) used for capture, generated silence and default playback.
SAMPLERATE = 48000
# Number of channels opened on the capture stream.
CHANNELS = 1

# Audio chunks appended by the stream callback during the current recording.
recording = []
# Flag polled by record_audio_live(); main() sets it to start/stop capture.
is_recording = False


def callback(indata, frames, time_info, status):
    """Store one captured chunk; used as the InputStream callback.

    Any truthy ``status`` passed by the stream is printed. ``indata`` is
    copied before being appended to the module-level ``recording`` list.
    ``frames`` and ``time_info`` are accepted but not used.
    """
    if status:
        print(status)
    chunk = indata.copy()
    # Appending mutates the shared list in place, so no rebinding is needed.
    recording.append(chunk)


def record_audio_live():
    """Capture microphone audio into ``recording`` until ``is_recording`` is false.

    Resets the module-level ``recording`` list, opens an int16 input stream
    wired to ``callback`` and polls the ``is_recording`` flag every 100 ms.
    The stream is closed when the flag is cleared.
    """
    global recording, is_recording
    recording = []
    print("Recording... press ENTER again to stop.")
    stream = sd.InputStream(
        samplerate=SAMPLERATE,
        channels=CHANNELS,
        dtype="int16",
        callback=callback,
    )
    with stream:
        while True:
            if not is_recording:
                break
            sd.sleep(100)
    print("Recording stopped.")


def play_audio(audio_np, samplerate=SAMPLERATE):
    """Play ``audio_np`` at ``samplerate`` and wait for playback to finish.

    Playback is best-effort: any exception raised while starting or waiting
    for playback is printed instead of propagated.
    """
    try:
        sd.play(audio_np, samplerate=samplerate)
        sd.wait()
    except Exception as playback_error:
        print("Playback error:", playback_error)


def audio_to_base64(audio_np, samplerate=SAMPLERATE):
    """Return ``audio_np`` serialized as a WAV file, base64-encoded as text.

    Args:
        audio_np: Sample array handed to ``scipy.io.wavfile.write``.
        samplerate: Sample rate written into the WAV header.

    Returns:
        The WAV file bytes, base64-encoded and decoded to a UTF-8 ``str``.
    """
    # Local import keeps this block self-contained.
    import io

    # Encode in memory: no temporary file is created, so nothing is left
    # behind on disk if writing the WAV data fails.
    wav_buffer = io.BytesIO()
    write(wav_buffer, samplerate, audio_np)
    return base64.b64encode(wav_buffer.getvalue()).decode("utf-8")


def base64_to_audio(audio_b64):
    """Decode a base64-encoded WAV file into samples and a sample rate.

    Args:
        audio_b64: Base64 text (or bytes) containing a complete WAV file.

    Returns:
        A ``(data, samplerate)`` tuple as produced by
        ``scipy.io.wavfile.read`` (note the order is swapped relative to
        scipy's ``(rate, data)``).

    Raises:
        Whatever ``base64.b64decode`` or ``scipy.io.wavfile.read`` raise for
        malformed input.
    """
    # Local import keeps this block self-contained.
    import io

    audio_bytes = base64.b64decode(audio_b64)
    # Parse from memory: no temporary file is created, so a malformed WAV
    # cannot leave a stray file on disk.
    samplerate, data = read(io.BytesIO(audio_bytes))
    return data, samplerate


def generate_silence(duration=1.0, samplerate=SAMPLERATE):
    """Return ``duration`` seconds of silence as a single-column int16 array.

    The array has ``int(duration * samplerate)`` rows and one column, all
    zeros.
    """
    frame_count = int(duration * samplerate)
    return np.zeros(shape=(frame_count, 1), dtype=np.int16)


def send_audio(username, audio_b64, scenario, feedback=False):
    """Post one recorded utterance to the server and return the reply audio.

    Args:
        username: Value sent as the ``username`` field.
        audio_b64: Base64-encoded audio sent as the ``audio`` field.
        scenario: Value sent as the ``scenario`` field.
        feedback: Value sent as the ``feedback`` field.

    Returns:
        The ``audio`` field of the JSON response, or ``None`` when the
        request fails, the response is not usable JSON, the server reports
        a validation failure, or no audio is present. Every failure is
        printed; none is raised.
    """
    data = {
        "username": username,
        "audio": audio_b64,
        "feedback": feedback,
        "scenario": scenario,
        "is_initial_request": False
    }

    try:
        response = requests.post(SERVER_URL, json=data, timeout=500)

        # Anything that is not declared as JSON cannot carry the reply audio.
        if not response.headers.get("Content-Type", "").startswith("application/json"):
            print("Unexpected response type:", response.text)
            return None

        try:
            resp_json = response.json()
        except ValueError as e:
            # A JSON Content-Type does not guarantee a parseable body; older
            # requests versions raise a plain ValueError here, which the
            # RequestException handler below would not catch.
            print("Error sending request:", e)
            return None

        # A JSON array/scalar has no fields to inspect; treat it like a
        # response without audio instead of failing on ``.get``.
        if not isinstance(resp_json, dict):
            print("⚠️ No audio field in response:", resp_json)
            return None

        # 🔴 Validation failures are reported by the server in the JSON body
        if resp_json.get("validation") is False:
            print("❌ Validation failed:", resp_json.get("errorMessage", "Unknown error"))
            return None

        # ✅ Normal audio response
        audio_field = resp_json.get("audio")
        if not audio_field:
            print("⚠️ No audio field in response:", resp_json)
            return None

        return audio_field

    except requests.exceptions.RequestException as e:
        print("Error sending request:", e)
        return None


def _print_feedback_details(feedback_json):
    """Print the optional analysis sections present in a feedback response."""
    # Display speech metrics and icon states if available
    if "speech_metrics" in feedback_json:
        print("\n=== Speech Metrics ===")
        metrics = feedback_json["speech_metrics"]
        print(f"Speech Rate (WPM): {metrics.get('speech_rate_wpm', 'N/A')}")
        print(f"Average Pause: {metrics.get('avg_pause', 'N/A')}s")
        print(f"Filler Count: {metrics.get('filler_count', 'N/A')}")
        print(f"Filler Ratio: {metrics.get('filler_ratio', 'N/A')}%")

    if "icon_states" in feedback_json:
        print("\n=== Icon States (for Unreal Engine) ===")
        icons = feedback_json["icon_states"]
        print(f"Speech Rate: {icons.get('speech_rate', 'N/A')}")
        print(f"Pauses: {icons.get('pauses', 'N/A')}")
        print(f"Fillers: {icons.get('fillers', 'N/A')}")
        print(f"Overall: {icons.get('overall', 'N/A')}")
    if "speech_summary" in feedback_json:
        print(f"\n{feedback_json['speech_summary']}")

    # Display Gordon pattern analysis if available
    if "gordon_patterns" in feedback_json:
        print("\n=== Gordon Pattern Analysis ===")
        patterns = feedback_json["gordon_patterns"]
        print(f"Covered Patterns: {patterns.get('covered_patterns', 0)}/11")
        print(f"Coverage Percentage: {patterns.get('coverage_percentage', 0)}%")
        if patterns.get("mentioned_patterns"):
            print(f"Mentioned Patterns: {patterns.get('mentioned_patterns', [])}")
        if patterns.get("summary"):
            print(f"\n{patterns.get('summary', '')}")


def _request_feedback(username, scenario):
    """Post a feedback request (with silent audio) and present the reply."""
    silent_audio = generate_silence()
    silent_b64 = audio_to_base64(silent_audio)

    # Send feedback request and get full response
    data = {
        "username": username,
        "audio": silent_b64,
        "feedback": True,
        "scenario": scenario
    }

    try:
        response = requests.post(SERVER_URL, json=data, timeout=60)
        response.raise_for_status()

        if not response.headers.get("Content-Type", "").startswith("application/json"):
            print("Unexpected response format:", response.text[:200])
            return

        feedback_json = response.json()
        audio_field = feedback_json.get("audio")

        if not audio_field:
            print("No audio in feedback response.")
            print("Full response:", feedback_json)
            return

        print("=== Feedback Summary ===")
        try:
            feedback_audio, sr = base64_to_audio(audio_field)
            play_audio(feedback_audio, sr)
        except Exception as e:
            print(f"Error playing audio: {e}")

        _print_feedback_details(feedback_json)
    except Exception as e:
        # Feedback is best-effort at shutdown: report the problem and let
        # the caller finish exiting.
        print(f"Error requesting feedback: {e}")


def main():
    """Run the interactive push-to-talk loop until the user presses Ctrl+C.

    Each round records between two ENTER presses, sends the audio with
    ``send_audio`` and plays the returned audio. On Ctrl+C any active
    recording is stopped, a feedback summary is requested from the server
    and the process exits with status 0.
    """
    global is_recording

    username = input("Enter your username: ").strip()

    scenario = input("Enter scenario number (e.g. 1, 2, 3...): ").strip()

    print("\n=== Push-to-Talk Online Mode ===")
    print("Press ENTER to start recording, ENTER again to stop.")
    print("Audio will be sent to the server and the reply will play.")
    print("Press Ctrl+C to exit.\n")

    rec_thread = None
    try:
        while True:
            input("Press ENTER to start recording...")
            is_recording = True
            rec_thread = threading.Thread(target=record_audio_live)
            rec_thread.start()

            input("")
            is_recording = False
            rec_thread.join()

            if not recording:
                print("No audio captured. Try again.")
                continue

            audio_np = np.concatenate(recording, axis=0)
            audio_b64 = audio_to_base64(audio_np)

            print("Sending audio to server...")
            audio_b64_resp = send_audio(username, audio_b64, scenario, feedback=False)

            if audio_b64_resp:
                print("Playing server response...")
                server_audio_np, sr = base64_to_audio(audio_b64_resp)
                play_audio(server_audio_np, sr)
            else:
                print("No audio received from server.")

            print("\n--- Ready for next round ---\n")
            time.sleep(0.5)

    except KeyboardInterrupt:
        # Ctrl+C may arrive while the recorder thread is still capturing.
        # Clear the flag and wait for the thread; otherwise the non-daemon
        # thread keeps polling forever and the process never exits.
        is_recording = False
        if rec_thread is not None and rec_thread.is_alive():
            rec_thread.join()

        print("\nConversation ended. Requesting feedback summary from server...")
        _request_feedback(username, scenario)

        print("\nGoodbye!")
        sys.exit(0)


# Start the interactive client only when this file is executed as a script.
if __name__ == "__main__":
    main()