File size: 6,520 Bytes
bd1c43c
4d3af55
 
 
bd1c43c
 
4d3af55
 
bd1c43c
 
 
 
 
 
70de1d6
 
bd1c43c
 
 
4d3af55
bd1c43c
 
4d3af55
 
 
70de1d6
 
bd1c43c
4d3af55
70de1d6
4d3af55
 
b3de037
4d3af55
690cc6d
effcc86
4d3af55
 
 
 
70de1d6
 
 
5b6371b
70de1d6
 
4d3af55
 
 
bd1c43c
 
 
 
4d3af55
bd1c43c
6e1bb73
 
 
4d3af55
 
 
 
 
70de1d6
4d3af55
bd1c43c
70de1d6
 
 
 
4d3af55
 
 
 
 
 
 
 
bd1c43c
4d3af55
 
bd1c43c
4d3af55
 
 
5b6371b
bd1c43c
6e1bb73
4d3af55
 
1a7b0d4
 
6e1bb73
4d3af55
bd1c43c
 
 
4d3af55
 
 
 
 
 
98b5e62
 
4d3af55
70de1d6
 
 
 
 
4d3af55
 
 
 
70de1d6
4d3af55
690cc6d
 
4d3af55
f66623b
 
bfa8620
f66623b
690cc6d
6e1bb73
0ce0c17
8d56dde
4d3af55
 
b3de037
4d3af55
 
2bca5f7
4d3af55
98b5e62
effcc86
690cc6d
4d3af55
b3de037
 
bfa8620
b3de037
 
 
5b6371b
bd1c43c
4d3af55
 
 
 
 
 
 
 
 
fcfd230
bd1c43c
4d3af55
 
 
 
 
 
 
 
 
 
 
70de1d6
4d3af55
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
import argparse
import queue
import time
import threading
import logging
import os

from PIL import Image

from daily import EventHandler, CallClient, Daily
from datetime import datetime
from dotenv import load_dotenv

from auth import get_meeting_token, get_room_name
from pipeline import Pipeline
from device import device, torch_dtype

# Load variables from a local .env file (if one exists) into the process
# environment so the os.getenv() lookups further down can see them.
load_dotenv()

class DailyVision(EventHandler):
    """Daily call bot that runs incoming video frames through a pipeline.

    The bot joins a Daily room, keeps the most recent video frame received
    from remote participants, runs it through ``Pipeline.predict`` on a
    worker thread and writes the result to a virtual camera device.
    Pipeline parameters can be replaced at runtime through app messages.
    """

    # How long the worker sleeps when there is no frame to process yet, so
    # that it does not spin a CPU core while waiting for the first frame.
    _IDLE_SLEEP_SECONDS = 0.01

    def __init__(
        self,
        room_url,
        room_name,
        expiration,
        idle,
        bot_name="Daily Bot"
    ):
        """Create the call client, the pipeline, the logger and the camera.

        Args:
            room_url: URL of the room; also embedded in every log line.
            room_name: Name of the room (stored, not otherwise used here).
            expiration: Absolute ``time.time()`` timestamp after which the
                worker loop stops.
            idle: When truthy the bot keeps running even if fewer than two
                participants are present in the call.
            bot_name: User name the bot sets on the call client.

        Raises:
            ValueError: If the ``FPS_CAP`` environment variable is set to
                something that is not a number.
        """
        self.__client = CallClient(event_handler=self)
        self.__camera = None
        self.__thread = None  # created in run(); leave() must cope with None
        self.__time = time.time()
        self.__app_quit = False
        self.__image_buffer = None
        # Parameters received via app message, waiting to be picked up by the
        # worker thread. Guarded by a lock because it is written from the
        # SDK callback and swapped out by the worker.
        self.__params_buffer = None
        self.__params_lock = threading.Lock()
        self.__bot_name = bot_name
        self.__room_url = room_url
        self.__room_name = room_name
        self.__expiration = expiration
        self.__idle = idle

        # Minimum number of seconds between two accepted frames. The default
        # of 0.0333 s corresponds to a cap of roughly 30 frames per second.
        self.__frame_interval = float(os.getenv("FPS_CAP", 0.0333))

        # Create the pipeline (this might take a moment)
        self.__params = Pipeline.InputParams()
        self.__pipeline = Pipeline(device, torch_dtype)

        # Configure logger. The room URL becomes part of a %-style format
        # string, so literal percent signs (e.g. URL escapes) must be doubled
        # or every log call would fail to format.
        safe_url = str(self.__room_url).replace("%", "%%")
        FORMAT = f"%(asctime)s {safe_url} %(message)s"
        logging.basicConfig(format=FORMAT)
        self.logger = logging.getLogger("bot-instance")
        self.logger.setLevel(logging.DEBUG)

        self.logger.info(f"Expiration timer set to: {self.__expiration}")

        # Setup camera
        self.setup_camera()

    def run(self, meeting_url, token):
        """Join the call and block until the frame-processing thread ends.

        Args:
            meeting_url: URL of the room to join.
            token: Meeting token passed to the client's ``join`` call.
        """
        # Join
        self.logger.info(f"Connecting to room {meeting_url} as {self.__bot_name}")
        self.__client.set_user_name(self.__bot_name)
        self.__client.join(meeting_url, token, completion=self.on_joined)

        # Start thread
        self.__thread = threading.Thread(target=self.process_frames)
        self.__thread.start()

        # Keep-alive on thread
        self.__thread.join()

    def leave(self):
        """Stop the worker thread (if it is running) and leave the call."""
        self.logger.info("Leaving...")
        self.__app_quit = True
        # run() may have failed or been interrupted before the thread was
        # created/started; only wait for a worker that is actually running.
        worker = self.__thread
        if worker is not None and worker.is_alive():
            worker.join()
        self.__client.leave()

    def on_joined(self, join_data, client_error):
        """Completion callback for ``join``; logs the result."""
        self.logger.info(f"call_joined: {join_data}, {client_error}")

    def on_participant_joined(self, participant):
        """Greet a new participant and start receiving their video.

        Sends the bot's parameters via ``wave`` and registers
        ``on_video_frame`` as the video renderer for that participant,
        requesting RGB frames.
        """
        self.logger.info(f"Participant {participant['id']} joined, analyzing frames...")
        self.wave()
        self.__client.set_video_renderer(participant["id"], self.on_video_frame, color_format="RGB")

    def setup_camera(self):
        """Create the 640x480 RGB virtual camera once and enable it as input."""
        if self.__camera is not None:
            return
        self.__camera = Daily.create_camera_device("camera",
                                                   width=640,
                                                   height=480,
                                                   color_format="RGB")
        self.__client.update_inputs({
            "camera": {
                "isEnabled": True,
                "settings": {
                    "deviceId": "camera"
                }
            }
        })

    def process_frames(self):
        """Worker loop: run the latest frame through the pipeline.

        Runs until ``leave`` is called, the expiration timestamp passes, or
        (unless the bot was created with ``idle``) fewer than two
        participants are in the call. The most recent frame stays in the
        buffer and is re-used until ``on_video_frame`` replaces it.

        Raises:
            Exception: Any error raised while converting, predicting or
                writing a frame is logged and re-raised, ending the thread.
        """
        params = self.__params

        while not self.__app_quit:
            # Is anyone watching?
            if not self.__idle and len(self.__client.participants()) < 2:
                self.logger.info("No partcipants in channel. Exiting...")
                self.__app_quit = True
                break
            # Check expiry timer
            if time.time() > self.__expiration:
                self.logger.info("Expiration timer exceeded. Exiting...")
                self.__app_quit = True
                break

            # Take and clear the pending parameters in one step so an update
            # arriving from on_app_message in between cannot be dropped.
            with self.__params_lock:
                pending = self.__params_buffer
                self.__params_buffer = None
            if pending is not None:
                print("New buffer params found")
                params = pending

            video_frame = self.__image_buffer
            if video_frame is None:
                # Nothing received yet: back off briefly instead of spinning.
                time.sleep(self._IDLE_SLEEP_SECONDS)
                continue

            try:
                image = Image.frombytes("RGB", (video_frame.width, video_frame.height), video_frame.buffer)
                result_image = self.__pipeline.predict(params, image)
                self.__camera.write_frame(result_image.tobytes())
            except Exception:
                # Record the failure in the bot's own log, make sure the loop
                # is flagged as stopped, then let the error end the thread.
                self.logger.exception("Frame processing failed. Exiting...")
                self.__app_quit = True
                raise

    def on_video_frame(self, participant_id, video_frame):
        """Store an incoming frame, dropping frames that arrive too quickly.

        A frame is kept only if more than the configured interval (the
        ``FPS_CAP`` environment variable, in seconds; default 0.0333, i.e.
        about 30 frames per second) has passed since the last kept frame.
        """
        now = time.time()
        if now - self.__time > self.__frame_interval:
            self.__time = now
            self.__image_buffer = video_frame

    def on_app_message(self, message, sender):
        """Queue new pipeline parameters built from an app message.

        The message is expanded as keyword arguments into
        ``InputParams``. Messages that cannot be turned into parameters are
        logged and ignored so a malformed payload from a remote participant
        does not raise inside the SDK callback.
        """
        try:
            new_params = self.__pipeline.InputParams(**message)
        except (TypeError, ValueError) as exc:
            # TypeError: message is not a mapping / has unexpected keys.
            # ValueError: presumably covers the model's validation errors
            # (InputParams looks like a pydantic model) -- TODO confirm.
            self.logger.warning(f"Ignoring invalid app message from {sender}: {exc}")
            return
        with self.__params_lock:
            self.__params_buffer = new_params

    def wave(self):
        """Send the bot's initial parameters to the call as a JSON app message."""
        self.__client.send_app_message(self.__params.model_dump_json())

def _str_to_bool(value):
    """Convert a command-line or environment flag value to a real boolean.

    ``argparse``'s ``type=bool`` treats every non-empty string (including
    "False" and "0") as ``True``; this converter parses the text instead.

    Args:
        value: A bool, or a string such as "true"/"false", "yes"/"no",
            "on"/"off", "1"/"0" (case-insensitive). An empty string is False.

    Returns:
        The parsed boolean.

    Raises:
        argparse.ArgumentTypeError: If the text is not a recognised boolean.
    """
    if isinstance(value, bool):
        return value
    text = str(value).strip().lower()
    if text in ("1", "true", "t", "yes", "y", "on"):
        return True
    if text in ("", "0", "false", "f", "no", "n", "off"):
        return False
    raise argparse.ArgumentTypeError(f"expected a boolean value, got {value!r}")


def main():
    """Parse command-line arguments, start the bot and leave on exit.

    Environment variables ``BOT_MAX_DURATION`` and ``BOT_WILL_IDLE`` provide
    the defaults for ``--expiration`` and ``--idle``. A meeting token is only
    requested when the room is flagged as private; otherwise the bot joins
    without a token.
    """
    parser = argparse.ArgumentParser(description="Daily Bot")
    # Required args
    parser.add_argument("-u", "--url", required=True, type=str, help="URL of the Daily room")
    parser.add_argument("-k", "--api_key", required=True, type=str, help="Daily API key")
    # Optional args
    parser.add_argument("-t", "--private", type=_str_to_bool, help="Is this room private?", default=True)
    parser.add_argument("-n", "--bot-name", type=str, help="Name of the bot", default="Daily Bot")
    parser.add_argument("-e", "--expiration", type=int, help="Duration of bot", default=os.getenv("BOT_MAX_DURATION", 300))
    # String defaults coming from the environment are passed through the
    # converter by argparse, so BOT_WILL_IDLE=false really means False.
    parser.add_argument("-i", "--idle", type=_str_to_bool, help="Wait for participants to join", default=os.getenv("BOT_WILL_IDLE", False))
    args = parser.parse_args()

    Daily.init()

    # --expiration is a duration in seconds; the bot works with the absolute
    # timestamp at which it should stop.
    expiration = time.time() + args.expiration
    room_name = get_room_name(args.url)

    # Retrieve a meeting token for private rooms; public rooms are joined
    # without one (token stays None instead of being left undefined).
    #@TODO do room lookup to check privacy
    token = None
    if args.private:
        token = get_meeting_token(room_name, args.api_key, expiration)

    app = DailyVision(args.url, room_name, expiration, args.idle, args.bot_name)

    try:
        app.run(args.url, token)
    except KeyboardInterrupt:
        print("Ctrl-C detected. Exiting!")
    finally:
        app.leave()

    # Let leave finish
    time.sleep(2)

# Run the bot only when this file is executed as a script, not when imported.
if __name__ == '__main__':
    main()