File size: 17,460 Bytes
5acd9c3
 
 
 
 
59e0f6a
5acd9c3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59e0f6a
 
 
 
 
 
 
 
 
 
 
 
 
5acd9c3
 
59e0f6a
5acd9c3
59e0f6a
 
 
5acd9c3
 
 
 
 
 
 
 
 
 
 
 
59e0f6a
5acd9c3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59e0f6a
5acd9c3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
import asyncio
import json
import logging
import os
import pathlib
import time
from aiohttp import web, WSMsgType
from typing import Dict, Any
from api_core import VideoGenerationAPI

from api_config import *

# Logging setup: INFO and above on the root logger, each record rendered as
# "<timestamp> - <logger name> - <level> - <message>".
_LOG_FORMAT = '%(asctime)s - %(name)s - %(levelname)s - %(message)s'
logging.basicConfig(format=_LOG_FORMAT, level=logging.INFO)

# Module-level logger shared by every handler in this file.
logger = logging.getLogger(__name__)

async def process_generic_request(data: dict, ws: web.WebSocketResponse, api) -> None:
    """Handle general requests that don't fit into specialized queues.

    Supported actions (read from ``data['action']``):

    * ``heartbeat`` / ``get_user_role`` - reply with the role stored on the
      socket as ``ws.user_role`` (``'anon'`` when the attribute is absent).
    * ``generate_caption`` - reply with ``api.generate_caption(title, description)``
      under the ``caption`` key.
    * ``generate_thumbnail`` - reply with ``api.generate_thumbnail(title, description)``
      under the ``thumbnailUrl`` key.

    Any other action yields an ``Unknown action`` error reply. Every reply
    echoes the request's ``action`` and ``requestId``.

    Args:
        data: Decoded client message.
        ws: WebSocket the reply is written to.
        api: Object providing ``generate_caption`` and ``generate_thumbnail``.

    Returns:
        None. Exceptions are logged and reported to the client as an
        ``Internal server error`` reply rather than propagated.
    """
    try:
        request_id = data.get('requestId')
        action = data.get('action')

        def error_response(message: str):
            return {
                'action': action,
                'requestId': request_id,
                'success': False,
                'error': message
            }

        if action in ('heartbeat', 'get_user_role'):
            # Both actions return the same payload: the caller's role.
            await ws.send_json({
                'action': action,
                'requestId': request_id,
                'success': True,
                'user_role': getattr(ws, 'user_role', 'anon')
            })

        elif action in ('generate_caption', 'generate_thumbnail'):
            # A client may send "params": null (or a non-object); treat that
            # as "no params" so it is reported as a validation error instead
            # of surfacing as an internal AttributeError.
            params = data.get('params')
            if not isinstance(params, dict):
                params = {}

            title = params.get('title')
            description = params.get('description')

            if not title or not description:
                await ws.send_json(error_response('Missing title or description'))
                return

            if action == 'generate_caption':
                payload = {'caption': await api.generate_caption(title, description)}
            else:
                payload = {'thumbnailUrl': await api.generate_thumbnail(title, description)}

            await ws.send_json({
                'action': action,
                'requestId': request_id,
                'success': True,
                **payload
            })

        else:
            await ws.send_json(error_response(f'Unknown action: {action}'))

    except Exception as e:
        logger.error(f"Error processing generic request: {str(e)}")
        try:
            await ws.send_json({
                'action': data.get('action'),
                'requestId': data.get('requestId'),
                'success': False,
                'error': f'Internal server error: {str(e)}'
            })
        except Exception as send_error:
            # The socket may already be closed; nothing more can be done.
            logger.error(f"Error sending error response: {send_error}")

async def process_search_queue(queue: asyncio.Queue, ws: web.WebSocketResponse, api):
    """Medium priority queue for search operations.

    Runs forever: takes one request dict at a time from ``queue``, calls
    ``api.search_video`` and writes exactly one ``search`` reply to ``ws``.
    The loop only ends when the task is cancelled.

    Args:
        queue: Queue of decoded client messages with ``action == 'search'``.
        ws: WebSocket the replies are written to.
        api: Object providing ``search_video(query, search_count=..., attempt_count=...)``.
    """
    while True:
        # Dequeue *outside* the try block: if the task is cancelled while
        # waiting here, no item was taken, so task_done() must not run
        # (it would raise ValueError and mask the cancellation).
        data = await queue.get()
        try:
            request_id = data.get('requestId')
            raw_query = data.get('query', '')
            # A missing, null or non-string query is treated as empty.
            query = raw_query.strip() if isinstance(raw_query, str) else ''
            search_count = data.get('searchCount', 0)
            attempt_count = data.get('attemptCount', 0)

            logger.info(f"Processing search request: query='{query}', search_count={search_count}, attempt={attempt_count}")

            if not query:
                logger.warning(f"Empty query received in request: {data}")
                result = {
                    'action': 'search',
                    'requestId': request_id,
                    'success': False,
                    'error': 'No search query provided'
                }
            else:
                try:
                    search_result = await api.search_video(
                        query,
                        search_count=search_count,
                        attempt_count=attempt_count
                    )
                except Exception as e:
                    logger.error(f"Search error for query '{query}' (#{search_count}, attempt {attempt_count}): {str(e)}")
                    result = {
                        'action': 'search',
                        'requestId': request_id,
                        'success': False,
                        'error': f'Search error: {str(e)}'
                    }
                else:
                    if search_result:
                        logger.info(f"Search successful for query '{query}' (#{search_count})")
                        result = {
                            'action': 'search',
                            'requestId': request_id,
                            'success': True,
                            'result': search_result
                        }
                    else:
                        logger.warning(f"No results found for query '{query}' (#{search_count})")
                        result = {
                            'action': 'search',
                            'requestId': request_id,
                            'success': False,
                            'error': 'No results found'
                        }

            await ws.send_json(result)

        except Exception as e:
            logger.error(f"Error in search queue processor: {str(e)}")
            try:
                await ws.send_json({
                    'action': 'search',
                    'requestId': data.get('requestId'),
                    'success': False,
                    'error': f'Internal server error: {str(e)}'
                })
            except Exception as send_error:
                logger.error(f"Error sending error response: {send_error}")
        finally:
            # Always balances the successful get() above.
            queue.task_done()

async def process_chat_queue(queue: asyncio.Queue, ws: web.WebSocketResponse):
    """High priority queue for chat operations.

    Runs forever: takes one request dict at a time from ``queue``, hands it
    to the matching ``handle_*`` method of the API object stored in
    ``ws.app['api']`` and writes the handler's result to ``ws``.

    Args:
        queue: Queue of decoded client messages whose ``action`` is
            ``join_chat``, ``chat_message`` or ``leave_chat``.
        ws: WebSocket the replies are written to; must carry an ``app``
            attribute exposing the API under the ``'api'`` key.
    """
    while True:
        data = await queue.get()
        try:
            api = ws.app['api']
            action = data['action']
            if action == 'join_chat':
                result = await api.handle_join_chat(data, ws)
            elif action == 'chat_message':
                result = await api.handle_chat_message(data, ws)
            elif action == 'leave_chat':
                result = await api.handle_leave_chat(data, ws)
            else:
                # Without this branch `result` would be unbound on the first
                # iteration, or silently reuse the previous request's result.
                result = {
                    'action': action,
                    'requestId': data.get('requestId'),
                    'success': False,
                    'error': f'Chat error: unknown action {action!r}'
                }
            await ws.send_json(result)
        except Exception as e:
            logger.error(f"Error processing chat request: {e}")
            try:
                await ws.send_json({
                    'action': data['action'],
                    'requestId': data.get('requestId'),
                    'success': False,
                    'error': f'Chat error: {str(e)}'
                })
            except Exception as send_error:
                logger.error(f"Error sending error response: {send_error}")
        finally:
            queue.task_done()

async def process_video_queue(queue: asyncio.Queue, ws: web.WebSocketResponse):
    """Process multiple video generation requests in parallel.

    Runs forever: pulls ``generate_video`` requests from ``queue`` and runs
    each in its own task, with at most ``len(VIDEO_ROUND_ROBIN_ENDPOINT_URLS)``
    tasks in flight. Each task writes exactly one ``generate_video`` reply
    (success or error) to ``ws``.

    The loop blocks on the queue and on a semaphore instead of polling, so
    an idle connection causes no periodic wakeups and a new request starts
    as soon as a slot is free.

    Args:
        queue: Queue of decoded client messages with ``action == 'generate_video'``.
        ws: WebSocket the replies are written to; must carry an ``app``
            attribute exposing the API under the ``'api'`` key.
    """
    active_tasks = set()  # strong references keep running tasks alive
    MAX_CONCURRENT = len(VIDEO_ROUND_ROBIN_ENDPOINT_URLS)  # Match client's max concurrent generations
    # One permit per concurrent generation. With zero endpoints configured
    # acquire() never returns, i.e. nothing is processed.
    slots = asyncio.Semaphore(MAX_CONCURRENT)

    async def process_single_request(data):
        try:
            api = ws.app['api']
            title = data.get('title', '')
            description = data.get('description', '')
            video_prompt_prefix = data.get('video_prompt_prefix', '')
            options = data.get('options', {})

            # Get the user role from the websocket
            user_role = getattr(ws, 'user_role', 'anon')

            # Pass the user role to generate_video
            video_data = await api.generate_video(title, description, video_prompt_prefix, options, user_role)

            result = {
                'action': 'generate_video',
                'requestId': data.get('requestId'),
                'success': True,
                'video': video_data,
            }

            await ws.send_json(result)

        except Exception as e:
            logger.error(f"Error processing video request: {e}")
            try:
                await ws.send_json({
                    'action': 'generate_video',
                    'requestId': data.get('requestId'),
                    'success': False,
                    'error': f'Video generation error: {str(e)}'
                })
            except Exception as send_error:
                logger.error(f"Error sending error response: {send_error}")

    def on_task_done(task):
        # Runs on the event loop when a generation task finishes: free the
        # slot, balance the queue.get(), and surface any unexpected error.
        active_tasks.discard(task)
        slots.release()
        queue.task_done()
        if task.cancelled():
            return
        error = task.exception()
        if error is not None:
            logger.error(f"Task failed with error: {error}")

    # NOTE(review): when this coroutine is cancelled, tasks already in flight
    # are left running (same as before this rewrite) - confirm whether they
    # should be cancelled when the client disconnects.
    while True:
        # Wait for capacity first so no request is held while all slots are busy.
        await slots.acquire()
        data = await queue.get()
        try:
            task = asyncio.create_task(process_single_request(data))
        except Exception as e:
            logger.error(f"Error creating video generation task: {e}")
            slots.release()
            queue.task_done()
            continue
        active_tasks.add(task)
        task.add_done_callback(on_task_done)

async def status_handler(request: web.Request) -> web.Response:
    """Handler for API status endpoint.

    Reports product name and version, the maintenance flag, the number of
    configured video endpoints and a per-endpoint snapshot taken from
    ``request.app['api'].endpoint_manager.endpoints``.

    ``active_endpoints`` counts endpoints that are not busy and whose
    ``error_until`` is unset (falsy) or already in the past.

    Args:
        request: Incoming HTTP request; only ``request.app`` is used.

    Returns:
        A JSON response with the status document.
    """
    api = request.app['api']
    now = time.time()  # single timestamp so all endpoints are judged alike

    # Get current busy status of all endpoints
    endpoint_statuses = [
        {
            'id': ep.id,
            'url': ep.url,
            'busy': ep.busy,
            'last_used': ep.last_used,
            'error_count': ep.error_count,
            'error_until': ep.error_until
        }
        for ep in api.endpoint_manager.endpoints
    ]

    def is_active(status: dict) -> bool:
        # The key is always present, so only its value matters. A falsy value
        # (None or 0) means "no error cooldown"; comparing None with a float
        # would raise TypeError.
        error_until = status['error_until']
        return not status['busy'] and (not error_until or error_until < now)

    return web.json_response({
        'product': PRODUCT_NAME,
        'version': PRODUCT_VERSION,
        'maintenance_mode': MAINTENANCE_MODE,
        'available_endpoints': len(VIDEO_ROUND_ROBIN_ENDPOINT_URLS),
        'endpoint_status': endpoint_statuses,
        'active_endpoints': sum(1 for status in endpoint_statuses if is_active(status))
    })

async def websocket_handler(request: web.Request) -> web.StreamResponse:
    """Serve one WebSocket client connection.

    While ``MAINTENANCE_MODE`` is set no upgrade is attempted and a 503 JSON
    response is returned. Otherwise the connection is upgraded, the user
    role is derived from the ``hf_token`` query parameter via
    ``api.validate_user_token`` and stored on the socket as ``ws.user_role``,
    and three background workers (chat, video, search) are started.

    Each text frame must be a JSON object. It is routed by its ``action``:
    chat actions, ``generate_video`` and ``search`` go to their queues;
    everything else is handled inline by ``process_generic_request``.

    Args:
        request: Incoming HTTP request for the ``/ws`` route.

    Returns:
        The ``WebSocketResponse`` after the connection has ended, or the
        503 JSON response in maintenance mode.
    """
    # Check if maintenance mode is enabled
    if MAINTENANCE_MODE:
        # Return an error response indicating maintenance mode
        return web.json_response({
            'error': 'Server is in maintenance mode',
            'maintenance': True
        }, status=503)  # 503 Service Unavailable

    ws = web.WebSocketResponse(
        max_msg_size=1024*1024*20,  # 20MB max message size
        timeout=30.0  # we want to keep things tight and short
    )

    # The queue workers reach the API through ws.app['api'].
    ws.app = request.app
    await ws.prepare(request)
    api = request.app['api']

    # Get the Hugging Face token from query parameters
    hf_token = request.query.get('hf_token', '')

    # Validate the token and determine the user role
    user_role = await api.validate_user_token(hf_token)
    logger.info(f"User connected with role: {user_role}")

    # Store the user role in the websocket
    ws.user_role = user_role

    # Create separate queues for different request types
    chat_queue = asyncio.Queue()
    video_queue = asyncio.Queue()
    search_queue = asyncio.Queue()

    # Start background tasks for handling different request types
    background_tasks = [
        asyncio.create_task(process_chat_queue(chat_queue, ws)),
        asyncio.create_task(process_video_queue(video_queue, ws)),
        asyncio.create_task(process_search_queue(search_queue, ws, api))
    ]

    try:
        async for msg in ws:
            if msg.type == WSMsgType.TEXT:
                # Reset per message so a parse failure never reports the
                # action of a previous message.
                data = None
                try:
                    data = json.loads(msg.data)
                    if not isinstance(data, dict):
                        # Valid JSON but not an object (e.g. a list or string):
                        # reject it here, the handlers all rely on dict access.
                        raise ValueError('Message must be a JSON object')
                    action = data.get('action')

                    # Route requests to appropriate queues
                    if action in ['join_chat', 'leave_chat', 'chat_message']:
                        await chat_queue.put(data)
                    elif action in ['generate_video']:
                        await video_queue.put(data)
                    elif action == 'search':
                        await search_queue.put(data)
                    else:
                        await process_generic_request(data, ws, api)

                except Exception as e:
                    logger.error(f"Error processing WebSocket message: {str(e)}")
                    try:
                        await ws.send_json({
                            'action': data.get('action') if isinstance(data, dict) else 'unknown',
                            'success': False,
                            'error': f'Error processing message: {str(e)}'
                        })
                    except Exception as send_error:
                        # Socket is probably closing; the loop ends on its own.
                        logger.error(f"Error sending error response: {send_error}")

            elif msg.type in (WSMsgType.ERROR, WSMsgType.CLOSE):
                break

    finally:
        # Cleanup: stop the queue workers and wait until they have finished.
        for task in background_tasks:
            task.cancel()
        try:
            await asyncio.gather(*background_tasks, return_exceptions=True)
        except asyncio.CancelledError:
            pass

    return ws

async def init_app() -> web.Application:
    """Build the aiohttp application.

    Creates the ``VideoGenerationAPI`` instance (stored under ``app['api']``),
    registers the ``/ws`` and ``/api/status`` routes, and adds a catch-all
    GET route that serves files from ``build/web`` next to this module,
    falling back to ``index.html`` for unknown paths (SPA routing). The
    directory is created if it does not exist.

    Returns:
        The configured application, ready to be passed to ``web.run_app``.
    """
    app = web.Application(
        client_max_size=1024**2*20  # 20MB max size
    )

    # Create API instance
    api = VideoGenerationAPI()
    app['api'] = api

    # Add cleanup logic
    async def cleanup_api(app):
        # Placeholder shutdown hook; no API cleanup is implemented yet.
        pass

    app.on_shutdown.append(cleanup_api)

    # Add routes
    app.router.add_get('/ws', websocket_handler)
    app.router.add_get('/api/status', status_handler)

    # Set up static file serving
    # Define the path to the public directory
    public_path = pathlib.Path(__file__).parent / 'build' / 'web'
    if not public_path.exists():
        public_path.mkdir(parents=True, exist_ok=True)
    public_root = public_path.resolve()

    # Content types by file extension; anything else is sent as text/plain.
    content_types = {
        '.html': 'text/html',
        '.js': 'application/javascript',
        '.css': 'text/css',
        '.jpg': 'image/jpeg',
        '.jpeg': 'image/jpeg',
        '.png': 'image/png',
        '.gif': 'image/gif',
        '.svg': 'image/svg+xml',
        '.json': 'application/json',
    }

    # Set up static file serving with proper security considerations
    async def static_file_handler(request):
        # Get the path from the request (removing leading /)
        path_parts = request.path.lstrip('/').split('/')

        try:
            safe_path = public_path.joinpath(*path_parts).resolve()
        except (ValueError, OSError):
            # e.g. embedded NUL byte or an unresolvable path
            raise web.HTTPNotFound()

        # Reject anything that resolves outside the public directory.
        # Compare path components, not string prefixes: a prefix test would
        # accept a sibling such as ".../web_secret" for root ".../web".
        try:
            safe_path.relative_to(public_root)
        except ValueError:
            raise web.HTTPForbidden(text="Access denied")

        # If path is a directory, look for index.html
        if safe_path.is_dir():
            safe_path = safe_path / 'index.html'

        # Check if the file exists
        if not safe_path.is_file():
            # If not found, serve index.html (for SPA routing)
            safe_path = public_path / 'index.html'
            if not safe_path.is_file():
                raise web.HTTPNotFound()

        # Determine content type based on file extension
        content_type = content_types.get(safe_path.suffix.lower(), 'text/plain')

        # Return the file with appropriate headers
        return web.FileResponse(safe_path, headers={'Content-Type': content_type})

    # Add catch-all route for static files (lower priority than API routes)
    app.router.add_get('/{path:.*}', static_file_handler)

    return app

if __name__ == '__main__':
    # Pass the coroutine itself: run_app awaits it on the loop that serves
    # requests. Building the app inside a separate asyncio.run() would create
    # it on a loop that is already closed by the time the server starts.
    web.run_app(init_app(), host='0.0.0.0', port=8080)