agl_service_voiceagent/client.py


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81

# SPDX-License-Identifier: Apache-2.0
#
# Copyright (c) 2023 Malik Talha
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import time
import grpc
from agl_service_voiceagent.generated import voice_agent_pb2
from agl_service_voiceagent.generated import voice_agent_pb2_grpc

def run_client(server_address, server_port, mode, nlu_engine, recording_time):
    SERVER_URL = server_address + ":" + server_port
    nlu_engine = voice_agent_pb2.RASA if nlu_engine == "rasa" else voice_agent_pb2.SNIPS
    print("Starting Voice Agent Client...")
    print(f"Client connecting to URL: {SERVER_URL}")
    with grpc.insecure_channel(SERVER_URL) as channel:
        print("Press Ctrl+C to stop the client.")
        print("Voice Agent Client started!")
        if mode == 'wake-word':
            stub = voice_agent_pb2_grpc.VoiceAgentServiceStub(channel)
            print("[+] Listening for wake word...")
            wake_request = voice_agent_pb2.Empty()
            wake_results = stub.DetectWakeWord(wake_request)
            wake_word_detected = False
            for wake_result in wake_results:
                print("Wake word status: ", wake_word_detected)
                if wake_result.status:
                    print("Wake word status: ", wake_result.status)
                    wake_word_detected = True
                    break

        elif mode == 'auto':
            raise ValueError("[-] Auto mode is not implemented yet.")

        elif mode == 'manual':
            stub = voice_agent_pb2_grpc.VoiceAgentServiceStub(channel)
            print("[+] Recording voice command in manual mode...")
            record_start_request = voice_agent_pb2.RecognizeControl(action=voice_agent_pb2.START, nlu_model=nlu_engine, record_mode=voice_agent_pb2.MANUAL)
            response = stub.RecognizeVoiceCommand(iter([record_start_request]))
            stream_id = response.stream_id

            time.sleep(recording_time) # pause here for the number of seconds passed by user or default 5 seconds

            record_stop_request = voice_agent_pb2.RecognizeControl(action=voice_agent_pb2.STOP, nlu_model=nlu_engine, record_mode=voice_agent_pb2.MANUAL, stream_id=stream_id)
            record_result = stub.RecognizeVoiceCommand(iter([record_stop_request]))
            print("[+] Voice command recording ended!")
            
            status = "Uh oh! Status is unknown."
            if record_result.status == voice_agent_pb2.REC_SUCCESS:
                status = "Yay! Status is success."
            elif record_result.status == voice_agent_pb2.VOICE_NOT_RECOGNIZED:
                status = "Voice not recognized."
            elif record_result.status == voice_agent_pb2.INTENT_NOT_RECOGNIZED:
                status = "Intent not recognized."

            # Process the response
            print("Status:", status)
            print("Command:", record_result.command)
            print("Intent:", record_result.intent)
            intent_slots = []
            for slot in record_result.intent_slots:
                print("Slot Name:", slot.name)
                print("Slot Value:", slot.value)
                i_slot = voice_agent_pb2.IntentSlot(name=slot.name, value=slot.value)
                intent_slots.append(i_slot)
            
            if record_result.status == voice_agent_pb2.REC_SUCCESS:
                print("[+] Executing voice command...")
                exec_voice_command_request = voice_agent_pb2.ExecuteInput(intent=record_result.intent, intent_slots=intent_slots)
                response = stub.ExecuteVoiceCommand(exec_voice_command_request)