agl_service_voiceagent/client.py


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122

# SPDX-License-Identifier: Apache-2.0
#
# Copyright (c) 2023 Malik Talha
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import time
import grpc
from agl_service_voiceagent.generated import voice_agent_pb2
from agl_service_voiceagent.generated import voice_agent_pb2_grpc

def run_client(server_address, server_port, action, mode, nlu_engine, recording_time):
    SERVER_URL = server_address + ":" + server_port
    nlu_engine = voice_agent_pb2.RASA if nlu_engine == "rasa" else voice_agent_pb2.SNIPS
    print("Starting Voice Agent Client...")
    print(f"Client connecting to URL: {SERVER_URL}")
    with grpc.insecure_channel(SERVER_URL) as channel:
        print("Press Ctrl+C to stop the client.")
        print("Voice Agent Client started!")
        if action == 'GetStatus':
            stub = voice_agent_pb2_grpc.VoiceAgentServiceStub(channel)
            print("[+] Checking status...")
            status_request = voice_agent_pb2.Empty()
            status_result = stub.CheckServiceStatus(status_request)
            print("Version:", status_result.version)
            print("Status:", status_result.status)
            print("Wake Word:", status_result.wake_word)

        elif action == 'DetectWakeWord':
            stub = voice_agent_pb2_grpc.VoiceAgentServiceStub(channel)
            print("[+] Listening for wake word...")
            wake_request = voice_agent_pb2.Empty()
            wake_results = stub.DetectWakeWord(wake_request)
            wake_word_detected = False
            for wake_result in wake_results:
                print("Wake word status: ", wake_word_detected)
                if wake_result.status:
                    print("Wake word status: ", wake_result.status)
                    wake_word_detected = True
                    break
        
        elif action == 'ExecuteVoiceCommand':
            if mode == 'auto':
                raise ValueError("[-] Auto mode is not implemented yet.")

            elif mode == 'manual':
                stub = voice_agent_pb2_grpc.VoiceAgentServiceStub(channel)
                print("[+] Recording voice command in manual mode...")
                record_start_request = voice_agent_pb2.RecognizeVoiceControl(action=voice_agent_pb2.START, nlu_model=nlu_engine, record_mode=voice_agent_pb2.MANUAL)
                response = stub.RecognizeVoiceCommand(iter([record_start_request]))
                stream_id = response.stream_id

                time.sleep(recording_time) # pause here for the number of seconds passed by user or default 5 seconds

                record_stop_request = voice_agent_pb2.RecognizeVoiceControl(action=voice_agent_pb2.STOP, nlu_model=nlu_engine, record_mode=voice_agent_pb2.MANUAL, stream_id=stream_id)
                record_result = stub.RecognizeVoiceCommand(iter([record_stop_request]))
                print("[+] Voice command recording ended!")
                
                status = "Uh oh! Status is unknown."
                if record_result.status == voice_agent_pb2.REC_SUCCESS:
                    status = "Yay! Status is success."
                elif record_result.status == voice_agent_pb2.VOICE_NOT_RECOGNIZED:
                    status = "Voice not recognized."
                elif record_result.status == voice_agent_pb2.INTENT_NOT_RECOGNIZED:
                    status = "Intent not recognized."

                # Process the response
                print("Status:", status)
                print("Command:", record_result.command)
                print("Intent:", record_result.intent)
                intent_slots = []
                for slot in record_result.intent_slots:
                    print("Slot Name:", slot.name)
                    print("Slot Value:", slot.value)
                    i_slot = voice_agent_pb2.IntentSlot(name=slot.name, value=slot.value)
                    intent_slots.append(i_slot)
                
                if record_result.status == voice_agent_pb2.REC_SUCCESS:
                    print("[+] Executing voice command...")
                    exec_voice_command_request = voice_agent_pb2.ExecuteInput(intent=record_result.intent, intent_slots=intent_slots)
                    response = stub.ExecuteCommand(exec_voice_command_request)

        elif action == 'ExecuteTextCommand':
            text_input = input("[+] Enter text command: ")
            
            stub = voice_agent_pb2_grpc.VoiceAgentServiceStub(channel)
            recognize_text_request = voice_agent_pb2.RecognizeTextControl(text_command=text_input, nlu_model=nlu_engine)
            response = stub.RecognizeTextCommand(recognize_text_request)

            status = "Uh oh! Status is unknown."
            if response.status == voice_agent_pb2.REC_SUCCESS:
                status = "Yay! Status is success."
            elif response.status == voice_agent_pb2.NLU_MODEL_NOT_SUPPORTED:
                status = "NLU model not supported."
            elif response.status == voice_agent_pb2.INTENT_NOT_RECOGNIZED:
                status = "Intent not recognized."

            # Process the response
            print("Status:", status)
            print("Command:", response.command)
            print("Intent:", response.intent)
            intent_slots = []
            for slot in response.intent_slots:
                print("Slot Name:", slot.name)
                print("Slot Value:", slot.value)
                i_slot = voice_agent_pb2.IntentSlot(name=slot.name, value=slot.value)
                intent_slots.append(i_slot)

            if response.status == voice_agent_pb2.REC_SUCCESS:
                    print("[+] Executing voice command...")
                    exec_text_command_request = voice_agent_pb2.ExecuteInput(intent=response.intent, intent_slots=intent_slots)
                    response = stub.ExecuteCommand(exec_text_command_request)