CoexistAI/app.py at main · SPThole/CoexistAI · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
from utils.websearch_utils import *
from utils.reddit_utils import *
from utils.map import *
from fastapi import FastAPI, Request
from pydantic import BaseModel
from utils.utils import *
from utils.map import *
from utils.git_utils import *
from utils.startup_banner import display_startup_banner, display_shutdown_banner, get_ascii_banner
from utils.knowledge_base import create_knowledge_base
from utils.crawler_utils import crawl_and_create_kb
import html as _html
from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import FileResponse, HTMLResponse
from fastapi.staticfiles import StaticFiles
from uuid import uuid4
import subprocess
from utils.tts_utils import *
from fastapi_mcp import FastApiMCP
import json
import os
import atexit
from model_config import *
import time
from typing import List, Optional, Union
from utils.knowledge_base import create_knowledge_base

# Shared, mutable status record for startup/reload notifications. It is updated
# in place during startup, config reloads and shutdown, and returned by the
# status and admin endpoints.
app_state = dict(status="starting", message="Initializing components...")


def init_components():
    """(Re)initialize model and embedding components from model_config. This is safe to call
    at startup or after config reload. It updates module-level globals used by request handlers.

    Every component is first built into a local variable and the module-level
    globals are rebound only after all steps have succeeded. A failure part way
    through therefore leaves the previously bound components in place instead
    of a mix of old and new ones.

    Side effects:
        Sets app_state['status'] to 'starting', then to 'ready' on success or
        'error' on failure, together with a matching app_state['message'].

    Raises:
        Exception: whatever the failing step raised; it is logged and re-raised
            after app_state has been marked as 'error'.
    """
    global llm, hf_embeddings, cross_encoder, text_splitter, searcher, date, day, llm_model_name, llm_type, llm_kwargs, embedding_model_name, embed_mode, cross_encoder_name

    app_state['status'] = 'starting'
    app_state['message'] = 'Loading models and embeddings (this may take a minute)...'
    print("=== CoexistAI Startup: Loading models and embeddings ===", flush=True)
    try:
        current = globals()

        # Read config values. Fallback order: model_config entry, then the value
        # already bound at module level (if any), then a hard-coded default.
        print("Reading configuration from model_config...", flush=True)
        new_llm_model_name = model_config.get("llm_model_name", current['llm_model_name'] if 'llm_model_name' in current else 'google/gemma-3-12b')
        new_llm_type = model_config.get("llm_type", current['llm_type'] if 'llm_type' in current else 'local')
        new_llm_kwargs = model_config.get("llm_kwargs", current['llm_kwargs'] if 'llm_kwargs' in current else {'temperature':0.1,'api_key': llm_api_key})

        new_embedding_model_name = model_config.get("embedding_model_name", current['embedding_model_name'] if 'embedding_model_name' in current else 'models/embedding-001')
        new_embed_mode = model_config.get("embed_mode", current['embed_mode'] if 'embed_mode' in current else 'google')
        new_cross_encoder_name = model_config.get("cross_encoder_name", current['cross_encoder_name'] if 'cross_encoder_name' in current else 'BAAI/bge-reranker-base')
        print(f"Config loaded: llm_type={new_llm_type}, llm_model={new_llm_model_name}, embed_mode={new_embed_mode}", flush=True)

        # instantiate generative LLM
        print(f"Initializing LLM: {new_llm_model_name} ({new_llm_type})...", flush=True)
        new_llm = get_generative_model(
            model_name=new_llm_model_name,
            type=new_llm_type,
            base_url=openai_compatible.get(new_llm_type, 'https://api.openai.com/v1'),
            _tools=None,
            kwargs=new_llm_kwargs
        )
        print("LLM initialized successfully", flush=True)

        # load embeddings and cross-encoder
        print(f"Loading embeddings: {new_embedding_model_name} (mode={new_embed_mode})...", flush=True)
        new_hf_embeddings, new_cross_encoder = load_model(new_embedding_model_name,
                                                          _embed_mode=new_embed_mode,
                                                          cross_encoder_name=new_cross_encoder_name,
                                                          kwargs=model_config.get('embed_kwargs', {}))
        print("Embeddings and cross-encoder loaded successfully", flush=True)

        print("Initializing text splitter...", flush=True)
        new_text_splitter = TokenTextSplitter(chunk_size=128, chunk_overlap=32)

        # recreate searxng searcher
        print(f"Initializing SearchWeb with {HOST_SEARXNG}:{PORT_NUM_SEARXNG}...", flush=True)
        new_searcher = SearchWeb(PORT_NUM_SEARXNG, HOST_SEARXNG)

        print("Getting local date and time...", flush=True)
        new_date, new_day = get_local_data()

        # Commit: nothing above raised, so publish the whole new set together.
        llm_model_name, llm_type, llm_kwargs = new_llm_model_name, new_llm_type, new_llm_kwargs
        embedding_model_name, embed_mode, cross_encoder_name = new_embedding_model_name, new_embed_mode, new_cross_encoder_name
        llm = new_llm
        hf_embeddings, cross_encoder = new_hf_embeddings, new_cross_encoder
        text_splitter = new_text_splitter
        searcher = new_searcher
        date, day = new_date, new_day

        app_state['status'] = 'ready'
        app_state['message'] = 'Ready'
        print("=== CoexistAI Startup Complete: All components ready ===", flush=True)
    except Exception as e:
        app_state['status'] = 'error'
        app_state['message'] = f'Initialization failed: {e}'
        # keep exception visible in logs
        print(f"=== CoexistAI Startup FAILED: {e} ===", flush=True)
        logger.exception('Failed to initialize components')
        raise


# Initialize components once at import/startup
# (This is now done in the lifespan startup handler)
# try:
#     init_components()
# except Exception as e:
#     # already logged; keep going so admin endpoints can be used to diagnose/fix
#     logger.error(f'Failed to initialize at startup: {e}')
#     # Update status to show startup failed but app is running for diagnostics
#     app_state['status'] = 'error'
#     app_state['message'] = f'Startup failed: {e}'

# Use config values for model and embedding paths. Each lookup falls back to a
# hard-coded default when the key is missing from model_config.
llm_model_name = model_config.get("llm_model_name", 'google/gemma-3-12b')
llm_type = model_config.get("llm_type", 'local')
llm_tools = model_config.get("llm_tools",None)
# Resolve the endpoint from the defaulted llm_type rather than indexing
# model_config directly: a config without 'llm_type' would otherwise raise
# KeyError here even though a default was just applied one line above.
llm_base_url = openai_compatible.get(llm_type,
                                     'https://api.openai.com/v1')


# Generation settings used only when the config does not provide 'llm_kwargs'.
llm_kwargs = model_config.get("llm_kwargs", {'temperature': 0.1,
                                            'max_tokens': None,
                                            'timeout': None,
                                            'api_key':llm_api_key,
                                            'max_retries': 2})

embed_kwargs = model_config.get("embed_kwargs", {})
embedding_model_name = model_config.get("embedding_model_name", "models/embedding-001")
embed_mode = model_config.get("embed_mode", "google")
cross_encoder_name = model_config.get("cross_encoder_name", "BAAI/bge-reranker-base")


# Report whether SearxNG can be reached. Nothing is started from here: running
# `docker` from inside a container is not supported in most environments (the
# binary may be missing or blocked by permissions), so the service is left to
# orchestration (docker-compose / external admin). Each message goes to the
# logger first and falls back to print() if the logging call itself raises.
if is_searxng_running():
    try:
        logger.info("SearxNG is reachable.")
    except Exception:
        print("SearxNG docker container is already running.")
else:
    try:
        logger.warning(f"SearxNG not reachable at {HOST_SEARXNG}:{PORT_NUM_SEARXNG}. Please start the searxng service (e.g. `docker compose up searxng`) or ensure it's reachable from this container.")
    except Exception:
        print(f"SearxNG not reachable at {HOST_SEARXNG}:{PORT_NUM_SEARXNG}. Please start searxng service.")

# Import-time construction of the components the request handlers read as
# module-level globals (llm, hf_embeddings, cross_encoder, text_splitter,
# searcher, date, day).
# NOTE(review): init_components() rebinds every one of these names and is called
# from the lifespan startup handler, so the work below appears to be repeated at
# startup -- confirm whether this import-time pass is still needed.
llm = get_generative_model(
    model_name=llm_model_name,
    type=llm_type,
    base_url=llm_base_url,
    _tools=None,
    kwargs=llm_kwargs
)

# load_model returns the embedding model and the cross-encoder as a pair.
hf_embeddings, cross_encoder = load_model(embedding_model_name,
                                          _embed_mode=embed_mode,
                                          cross_encoder_name=cross_encoder_name,
                                          kwargs=embed_kwargs)

# NOTE(review): init_components() builds its splitter with chunk_size=128 and
# chunk_overlap=32, which differs from the values here -- confirm which pair is intended.
text_splitter = TokenTextSplitter(chunk_size=512, chunk_overlap=128)

searcher = SearchWeb(PORT_NUM_SEARXNG, HOST_SEARXNG)
# Date and day are captured once here and passed to query_web_response by the
# web-search handler.
date, day = get_local_data()

# Lifespan context manager for startup/shutdown
from contextlib import asynccontextmanager

@asynccontextmanager
async def lifespan(app_instance):
    """Run component initialization at application startup and flag shutdown on exit.

    A failure inside init_components() is reported (stdout, logger, app_state)
    but not re-raised, so the application still starts serving afterwards.

    Args:
        app_instance: The application object handed in by the framework; unused here.
    """
    rule = "=" * 80

    # ---- startup ----
    print("\n" + rule, flush=True)
    print("FastAPI app starting up...", flush=True)
    logger.info("FastAPI app starting up...")
    app_state.update(status='starting', message='Initializing components...')
    try:
        init_components()
        print(rule + "\n", flush=True)
    except Exception as exc:
        print(f"STARTUP ERROR: {exc}", flush=True)
        print(rule + "\n", flush=True)
        logger.error(f"Failed to initialize components during startup: {exc}", exc_info=True)
        app_state.update(status='error', message=f'Startup failed: {exc}')

    yield

    # ---- shutdown ----
    logger.info("FastAPI app shutting down...")
    app_state.update(status='shutting_down', message='App shutting down')

# The ASGI application. `lifespan` (defined above) performs component
# initialization on startup and marks app_state on shutdown.
app = FastAPI(title='coexistai', lifespan=lifespan)

# Mount static files: everything under the "artifacts" directory is served at
# the /artifacts URL prefix.
# NOTE(review): the directory is given as a relative path, so it presumably
# resolves against the process working directory -- confirm it exists there.
app.mount("/artifacts", StaticFiles(directory="artifacts"), name="artifacts")


# --- Admin endpoints for runtime config reload/update ---------------------------------
from fastapi import HTTPException, Depends


def _check_admin_token(token: str = None):
    # token supplied via header X-Admin-Token or env ADMIN_TOKEN
    # FastAPI dependency will pass header automatically when named 'x_admin_token'
    env_token = os.environ.get('ADMIN_TOKEN')
    if env_token is None:
        # no admin token configured; disallow by default to avoid accidental exposure
        raise HTTPException(status_code=403, detail='Admin actions disabled (no ADMIN_TOKEN set)')
    if token != env_token:
        raise HTTPException(status_code=401, detail='Invalid admin token')
    return True


@app.post('/admin/reload-config')
async def admin_reload_config(request: Request):
    """Reload model config from the configured JSON file. Protected by ADMIN_TOKEN env var.
    Send header 'X-Admin-Token: <token>' to authenticate. Returns the reloaded config on success.
    """
    # Authentication: _check_admin_token raises HTTPException itself (401/403),
    # which simply propagates to the framework.
    _check_admin_token(request.headers.get('X-Admin-Token'))

    # Step 1: re-read the config; any failure is reported as a 500.
    try:
        reloaded = reload_model_config()
    except Exception as exc:
        raise HTTPException(status_code=500, detail=f'Failed to reload config: {exc}')

    # Step 2: rebuild the components so the new config takes effect immediately.
    try:
        init_components()
    except Exception as exc:
        raise HTTPException(status_code=500, detail=f'Config reloaded but applying failed: {exc}')

    return {"status": "ok", "model_config": reloaded, "app_state": app_state}

@app.post('/admin/update-config')
async def admin_update_config(request: Request):
    """Overwrite the config file with the posted JSON body. Protected by ADMIN_TOKEN.
    Body must be a JSON object compatible with the config schema. Returns saved config on success.
    """
    # Authentication: _check_admin_token raises HTTPException (401/403) itself.
    _check_admin_token(request.headers.get('X-Admin-Token'))

    try:
        body = await request.json()
    except Exception:
        raise HTTPException(status_code=400, detail='Invalid JSON body')
    # Enforce the documented contract before touching the file: a list, string
    # or number is valid JSON but is not a config object.
    if not isinstance(body, dict):
        raise HTTPException(status_code=400, detail='Config body must be a JSON object')

    # Target file: CONFIG_PATH if set, otherwise config/model_config.json next to this module.
    cfg_path = os.environ.get('CONFIG_PATH', os.path.join(os.path.dirname(__file__), 'config', 'model_config.json'))
    cfg_dir = os.path.dirname(cfg_path)
    try:
        # A bare filename has an empty dirname, and os.makedirs('') raises, so
        # only create the directory when there is one to create.
        if cfg_dir:
            os.makedirs(cfg_dir, exist_ok=True)
        with open(cfg_path, 'w') as f:
            json.dump(body, f, indent=2)
    except Exception as e:
        raise HTTPException(status_code=500, detail=f'Failed to write config: {e}')

    try:
        new_cfg = reload_model_config(cfg_path)
    except Exception as e:
        raise HTTPException(status_code=500, detail=f'Config saved but reload failed: {e}')

    # apply new config immediately
    try:
        init_components()
    except Exception as e:
        raise HTTPException(status_code=500, detail=f'Config saved but applying failed: {e}')

    return {"status": "ok", "saved": cfg_path, "model_config": new_cfg, "app_state": app_state}

# --------------------------------------------------------------------------------------


@app.get('/admin', response_class=HTMLResponse)
async def admin_page():
    """Serve the static admin UI and inject the ASCII banner at request time.
    The static UI lives at ./static/admin.html so it's easier to edit and keep
    app.py small.
    """
    try:
        static_path = os.path.join(os.path.dirname(__file__), 'static', 'admin.html')
        with open(static_path, 'r', encoding='utf-8') as f:
            page = f.read()
    except Exception as e:
        # The exception text ends up inside markup, so escape it like the banner below.
        error_text = _html.escape(str(e))
        return HTMLResponse(content=f"<html><body>Error loading admin UI: {error_text}</body></html>", status_code=500)

    # inject the ascii banner into the HTML, escaped for safety
    try:
        banner = get_ascii_banner() or ''
        page = page.replace('BANNER_PLACEHOLDER', _html.escape(banner))
    except Exception:
        # The banner is cosmetic: still serve the page, but leave a trace in the
        # logs instead of discarding the error silently.
        logger.exception('Failed to inject ASCII banner into admin page')
    return HTMLResponse(content=page)


@app.get('/status')
async def status():
    """Return basic app startup/reload status for UI and health checks."""
    # The live module-level state dict is handed back directly (no copy).
    return app_state


@app.get('/admin/config')
async def admin_get_config():
    """Return the effective model_config plus helper globals for the admin UI."""
    # NOTE(review): unlike the other /admin POST endpoints this route does not
    # call _check_admin_token, and model_config is returned unmasked -- confirm
    # that it cannot carry secrets (e.g. an api_key inside llm_kwargs).

    def _mask(secret):
        # Show at most the first and last three characters of a secret; values
        # of six characters or fewer are fully starred out, and empty values or
        # any failure yield an empty string.
        try:
            if not secret:
                return ''
            text = str(secret)
            size = len(text)
            return '*' * size if size <= 6 else text[:3] + '...' + text[-3:]
        except Exception:
            return ''

    module_vars = globals()
    # Shallow copy of the config with a '_meta' entry carrying the
    # OpenAI-compatible endpoint table, host/port values and masked API keys.
    return {
        **model_config,
        '_meta': {
            'openai_compatible': openai_compatible,
            'HOST_APP': module_vars.get('HOST_APP'),
            'PORT_NUM_APP': module_vars.get('PORT_NUM_APP'),
            'HOST_SEARXNG': module_vars.get('HOST_SEARXNG'),
            'PORT_NUM_SEARXNG': module_vars.get('PORT_NUM_SEARXNG'),
            'llm_api_key': _mask(module_vars.get('llm_api_key')),
            'embed_api_key': _mask(module_vars.get('embed_api_key')),
        },
    }

# Register shutdown handler: display_shutdown_banner runs when the interpreter exits.
atexit.register(display_shutdown_banner)

# Origins allowed to make cross-origin requests to this API.
origins = [
    "*",  # Allow all origins (use specific domains in production)
]

# NOTE(review): a wildcard origin combined with allow_credentials=True is a very
# permissive setup (the CORS specification does not permit a literal "*" origin
# on credentialed requests) -- confirm this is intended outside local development.
app.add_middleware(
    CORSMiddleware,
    allow_origins=origins,  # e.g. ["http://localhost", "http://localhost:3000"]
    allow_credentials=True,
    allow_methods=["*"],    # Allow all HTTP methods (including OPTIONS)
    allow_headers=["*"],    # Allow all headers
)

# Landing route: returns a fixed welcome message. Documented with a comment
# rather than a docstring so the generated route description stays unchanged.
@app.get('/')
async def root():
    return {"message": "Welcome to CoexistAI!"}

# Request body for POST /web-search. Documented with comments rather than a
# class docstring so the JSON schema generated from the model is untouched.
class WebSearchRequest(BaseModel):
    query: str  # The search query
    rerank: bool = True  # Whether to rerank the retrieved results
    num_results: int = 2  # Requested number of search results; the /web-search handler caps it at 2
    local_mode: bool = False  # Whether to process local documents
    split: bool = True  # Whether to split documents into chunks
    document_paths: list[str] = []  # List of paths for local documents
    vectordb: str = ""  # Optional vector database name to use instead of search
    quick_answer: bool = False  # Whether to force quick answer mode (disables summary mode)

# Request body for POST /youtube-search.
class YouTubeSearchRequest(BaseModel):
    query: str  # A YouTube video URL, or a search term when no URL is given
    prompt: str  # Prompt used to generate the response from the transcript
    n: int = 1  # Number of videos to summarize, default is 1

# Request body for POST /reddit-search.
# Fields that default to None are declared Optional so that a client sending an
# explicit JSON null (rather than omitting the key) still passes validation.
class RedditSearchRequest(BaseModel):
    subreddit: Optional[str] = None  # Subreddit to read or search in
    url_type: str = "hot"  # Listing type; the handler switches it to 'search' when search_query is set
    n: int = 3  # Number of posts to retrieve
    k: int = 1  # Number of comments per post to return
    custom_url: Optional[str] = None  # Custom Reddit URL
    time_filter: str = "all"  # Time filter for the search (e.g. 'all', 'day')
    search_query: Optional[str] = None  # Search query; leave unset when not searching
    sort_type: str = "relevance"  # Sorting type for the results

# Request body for POST /map-search.
class MapSearchRequest(BaseModel):
    start_location: Optional[str] = None  # Start location can be a string or None
    end_location: Optional[str] = None  # End location can be a string or None
    pois_radius: int = 500  # Default radius for POIs in meters
    amenities: str = "restaurant|cafe|bar|hotel"  # Amenity types to search for, separated by '|'
    limit: int = 3  # Default number of results to return
    task: str = "route_and_pois"  # "route_and_pois" (default) or "location_only"

# Request body for POST /web-summarize.
class WebSummarizeRequest(BaseModel):
    query: str  # The question the summary should answer
    url: str  # URL of the web page to summarize
    local_mode: bool = False  # Whether to process local documents

# Request body for POST /git-tree-search.
class GitTreeRequest(BaseModel):
    repobaseurl: str  # Base URL of a GitHub repository, or path to a local repository

# Request body for POST /git-search.
class GitSearchRequest(BaseModel):
    repobaseurl: str  # Base URL of a GitHub repository, or path to a local repository
    parttoresearch: str  # Path inside the repository to fetch (e.g. 'basefolder/subfolder')
    query: str  # The user's question about the fetched content
    type: str  # "Folder" or "file"

# Request body for POST /local-folder-tree.
class LocalFolderTreeRequest(BaseModel):
    folder_path:str  # Root directory of the tree
    level: str = 'broad-first'  # One of 'full', 'broad-first', 'broad-second'
    prefix: str = ''  # Indentation prefix (internal)

# Request body for POST /check-response.
class ResearchCheckRequest(BaseModel):
    query: str  # The user's original query
    toolsshorthand: str  # Facts/information collected so far from past tool usage, in bullet form

# Request body for POST /clickable-elements.
class ClickableElementRequest(BaseModel):
    url:str  # Page whose clickable elements are searched
    query:str  # Query used to filter/rank the clickable elements
    topk:int=10  # Number of top clickable elements to return

# Request model with an optional text and an optional theme prompt.
# NOTE(review): the endpoint consuming this model is outside the visible part of
# the file; the name suggests podcast generation -- confirm.
# Both fields default to None and are declared Optional so that an explicit
# JSON null is accepted as well as an omitted key.
class PodcastRequest(BaseModel):
    text: Optional[str] = None
    prompt: Optional[str] = None  # Optional theme for the podcast

# Request model carrying a text plus voice, language and output-filename settings.
# NOTE(review): the endpoint consuming this model is outside the visible part of
# the file; the name suggests text-to-speech -- confirm.
# `text` defaults to None and is declared Optional so that an explicit JSON null
# is accepted as well as an omitted key.
class BasicTTSRequest(BaseModel):
    text: Optional[str] = None
    voice: str = "am_santa"
    lang: str = "en-us"
    filename: str = ""

# Request body for POST /create-knowledge-base.
class KnowledgeBaseRequest(BaseModel):
    document_paths: list[str]  # List of paths (folders or files) to create the knowledge base from

# Request body for POST /crawl-and-create-knowledge-base.
class CrawlerRequest(BaseModel):
    url_or_urls: Union[str, List[str]]  # Single URL to crawl or list of URLs to scrape
    keywords: Optional[List[str]] = [""]  # Optional keywords to filter content (default: one empty string)
    depth: Optional[int] = None  # Crawl depth for crawling (None for full website crawl)
    crawl: bool = True  # Whether to crawl (True) or process URLs directly (False)
    min_delay: float = 1.0  # Minimum delay between requests in seconds
    max_delay: float = 2.0  # Maximum delay between requests in seconds
    max_pages: int = 10000  # Maximum number of pages to collect during crawling
    url_keyword: Optional[str] = ""  # Optional keyword to filter URLs by presence in the URL string

@app.post('/clickable-elements', operation_id="get_website_structure")
async def get_website_structure(request: ClickableElementRequest):
    """
    Retrieves the top-k clickable elements from a given URL based on a query.
    This will help you to find out if there are any clickable elements on the page that match the query.
    You can use this to find deeper links since connected pieces of information are often linked together.
    RECOMMENDATION: Be specific with the query to get the most relevant clickable elements.
    Args:
        url (str): The URL to search for clickable elements.
        query (str): The query to filter the clickable elements.
        topk (int): The number of top clickable elements to return.
    Returns:
        list: A list of dictionaries containing the title, URL, and score of each clickable element.
    """
    # Unpack the request, then delegate the ranking to the helper.
    page_url, needle, limit = request.url, request.query, request.topk
    return await get_topk_bm25_clickable_elements(page_url, needle, limit)

@app.post('/local-folder-tree', operation_id="get_local_folder_tree")
async def get_local_folder_tree(request: LocalFolderTreeRequest):
    """
    Async Markdown folder tree.
    Args:
        folder_path (str): Root directory.
        level (str):
            - 'full': Show all folders and files, recursively, except hidden/system/cache entries.
            - 'broad-first': Only show immediate (top-level) folders and files (no nesting).
            - 'broad-second': Show top-level folders/files and their immediate child folders/files (two levels, no deeper).
        prefix (str): Indentation (internal)
    Returns:
        str: Markdown tree string
    """
    # The request fields map one-to-one onto folder_tree's arguments.
    tree_markdown = await folder_tree(
        request.folder_path,
        level=request.level,
        prefix=request.prefix,
    )
    return tree_markdown

@app.post('/git-tree-search',operation_id="get_git_tree")
async def get_git_tree(request:GitTreeRequest):
    """
    Retrieves and returns the directory tree structure of a GitHub repository or a local Git repository.

    Args:
        url (str): The base URL of the GitHub repository (e.g., 'https://github.com/user/repo')
                   or the path to the local repository on your system.

    Returns:
        str: The directory tree structure as a string.
    """
    # NOTE(review): the docstring calls the argument `url`, but the request
    # field that carries it is `repobaseurl`.
    repo_location = request.repobaseurl
    return await git_tree_search(repo_location)

@app.post('/git-search',operation_id="get_git_search")
async def get_git_search(request:GitSearchRequest):
    """
    Fetches the content of a specific part (directory or file) from either and does what asked in users query.
    First use get_git_tree to understand the structure of the repo and which part might be useful to answer users query
    - a GitHub repository (via URL), or
    - a local Git repository (via local path).

    Args:
        base_url (str): The base URL of the GitHub repository (e.g., 'https://github.com/user/repo'),
                        or the local path to the root of the repository.
        part (str): The path inside the repository you wish to access (e.g., 'basefolder/subfolder'). use get_git_tree for getting specific part if needed
        query (str): Users query
        type (str): "Folder" or "file"
    Returns:
        str: Response of the users query based on the content fetched
    """
    # NOTE(review): the docstring names `base_url` and `part`; the request
    # fields that carry them are `repobaseurl` and `parttoresearch`.

    # Step 1: pull the requested folder/file content out of the repository.
    content = await git_specific_content(
        request.repobaseurl,
        request.parttoresearch,
        request.type,
    )

    # Step 2: ask the module-level LLM to answer the query from that content.
    llm_prompt = f"""You are a professional coder, your task is to answer the users query based on the content fetched from git repo
User Query: {request.query}
Fetched Content: {content}
"""
    reply = await llm.ainvoke(llm_prompt)
    return reply.content

@app.post('/web-search',operation_id="get_web_search")
async def websearch(request: WebSearchRequest):
    """
    Performs a web search and retrieves results, then generates a response based on those results.
    It also throws back the next steps, you should carry out your research until there are no next steps left.
    RECOMMENDATION: Be specific with the query to get the most relevant results. and Set num_results to 2 (for better results)
    Args:
        query (str): The input query.
        rerank (bool): Whether to rerank results.
        num_results (int, optional): Number of search results to retrieve. Defaults to 2. Values above 2 are capped at 2.
        document_paths (list of str, optional): List of paths for local documents/folders. Defaults to empty list. for an example [path1,path2,path3]. if different tasks are related to different documents
        local_mode (bool, optional): Whether to process local documents. Defaults to False.
        split (bool, optional): Whether to split documents into chunks. Defaults to True.
        vectordb (str, optional): Name of an existing vector database to query instead of performing search. Defaults to an empty string.
        quick_answer (bool, optional): Whether to force quick answer mode (disables summary mode). Defaults to False.

    Returns:
        str: Generated response to query based on the retrieved and reranked search results and sources
    """
    # Models, embeddings, searcher and date/day are the module-level components
    # set up at startup / config reload; the same LLM is used for both model roles.
    try:
        result = await query_web_response(
            query=request.query,
            date=date,
            day=day,
            websearcher=searcher,
            hf_embeddings=hf_embeddings,
            rerank=request.rerank,
            cross_encoder=cross_encoder,
            model=llm,
            text_model=llm,
            num_results=min(2,request.num_results),  # never ask for more than 2 results
            document_paths=request.document_paths,
            local_mode=request.local_mode,
            split=request.split,
            vectordb=request.vectordb,
            quick_answer=request.quick_answer
        )
        # result[0] is the generated answer, result[1] the sources text.
        return "result:" + result[0] + '\n\nsources:' + result[1]
    except Exception:
        # Catch Exception rather than everything, so task cancellation and
        # interpreter-exit signals still propagate; log the real cause because
        # the caller only receives the generic message below.
        logger.exception("web-search request failed")
        return "No Websites found, Try rephrasing query"

@app.post('/create-knowledge-base', operation_id="get_knowledge_base")
async def create_kb(request: KnowledgeBaseRequest):
    """
    Creates a knowledge base from the provided document paths.
    Processes all files in the paths, embeds them, and saves to a vector database.

    Args:
        document_paths (list of str): List of paths to folders or files to include in the knowledge base.

    Returns:
        str: The name of the created vector database collection.
    """
    # Failures are reported to the caller as a plain message string, not as an
    # HTTP error.
    try:
        kb_name = await create_knowledge_base(
            document_paths=request.document_paths,
            hf_embeddings=hf_embeddings,
        )
        return f"Knowledge base created successfully. Collection name: {kb_name}"
    except Exception as exc:
        return f"Error creating knowledge base: {exc!s}"

@app.post('/crawl-and-create-knowledge-base', operation_id="get_crawled_knowledge_base")
async def crawl_kb(request: CrawlerRequest):
    """
    Crawls a website or processes a list of URLs and creates a knowledge base from the content.

    Args:
        url_or_urls: Single URL to crawl or list of URLs to scrape directly
        keywords: Optional list of keywords to filter content by
        depth: Maximum crawl depth for crawling (None for full website crawl)
        crawl: Whether to crawl (True) or process URLs directly (False)
        min_delay: Minimum delay between requests in seconds (default: 1.0)
        max_delay: Maximum delay between requests in seconds (default: 2.0)
        max_pages: Maximum number of pages to collect during crawling (default: 10000)
        url_keyword: Optional keyword to filter URLs by presence in the URL string

    Returns:
        str: Message with the collection name and list of scraped URLs.
    """
    # The defaults quoted above are the ones declared on CrawlerRequest, which
    # are what actually applies when a caller omits a field.
    # Failures are reported to the caller as a plain message string, not as an
    # HTTP error.
    try:
        collection_name, scraped_urls = await crawl_and_create_kb(
            url_or_urls=request.url_or_urls,
            keywords=request.keywords,
            depth=request.depth,
            crawl=request.crawl,
            min_delay=request.min_delay,
            max_delay=request.max_delay,
            max_pages=request.max_pages,
            url_keyword=request.url_keyword,
            hf_embeddings=hf_embeddings
        )
        return f"Crawled knowledge base created successfully. Collection name: {collection_name}. Scraped URLs: {scraped_urls}"
    except Exception as e:
        return f"Error creating crawled knowledge base: {str(e)}"

@app.post('/web-summarize', operation_id="get_web_summarize")
async def websummarize(request: WebSummarizeRequest):
    """Generates a summary of a web page based on the provided query and URL.
    Args:
        query (str): The input query.
        url (str): The URL of the web page to summarize.
        local_mode (bool): Whether to process local documents.
    Returns:
        str:  The generated summary of the url provided to answer query"""
    # The summarization model is not a request argument: the module-level LLM
    # is always used.
    try:
        result = await summary_of_url(
            query=request.query,
            url=request.url,
            model=llm,
            local_mode=request.local_mode
        )
        return result
    except Exception:
        # Catch Exception rather than everything, so task cancellation and
        # interpreter-exit signals still propagate; log the real cause because
        # the caller only receives the generic message below.
        logger.exception("web-summarize request failed")
        return "URL is not reacheable, try different URL"

@app.post('/youtube-search', operation_id="get_youtube_search")
async def youtube_search(request: YouTubeSearchRequest):
    """Performs a YouTube search and return summaries of it.
    Args:
        query (str): The YouTube video URL if provided else search term
        prompt (str): The prompt to generate a response from the transcript.
        n (int): Number of videos to summarize if search term is provided instead of URL.
    Returns:
        str: response from the YouTube transcripts based on the given query"""
    # Delegates to the transcript helper with the module-level LLM.
    # `n` is the number of videos to summarise.
    return youtube_transcript_response(
        request.query,
        request.prompt,
        n=request.n,
        model=llm,
    )

@app.post('/reddit-search', operation_id="get_reddit_search")
async def reddit_search(request: RedditSearchRequest):
    """Performs a Reddit search and retrieves posts based on the provided parameters.
    Args:
        subreddit (str): The subreddit to search in. When search_query is provided
        url_type (str): The type of Reddit URL to fetch (e.g., 'search','hot', 'new','top','best','controversial','rising').
                        set to 'search' if specific search_query is provided
        n (int): Number of posts to retrieve.
        k (int): Number of comments on each post to return after processing. When more perspectives needed increase this.
        custom_url (str): Custom URL for Reddit search.
        time_filter (str): Time filter for the search (e.g., 'all', 'day').
        search_query (str): Search query for Reddit posts. IF NOT SEARCHING FOR A QUERY, dont set this value, keep it ""
        sort_type (str): Sorting type for the results.
        Returns:
            str: A response containing the summary of the Reddit search results"""
    # A non-empty search_query always forces the 'search' listing type,
    # whatever url_type the caller sent.
    effective_url_type = 'search' if request.search_query else request.url_type
    return reddit_reader_response(
        subreddit=request.subreddit,
        url_type=effective_url_type,
        n=request.n,
        k=request.k,
        custom_url=request.custom_url,
        time_filter=request.time_filter,
        search_query=request.search_query,
        sort_type=request.sort_type,
        model=llm,
    )

@app.post('/map-search', operation_id="get_map_search")
async def map_search(request: MapSearchRequest):
    """Performs a map search and retrieves the route and points of interest like  (POIs) between two locations.
    Args:
        start_location (optional str): The starting location for the route. can be None as well
        end_location (optional str): The destination location for the route.can be None as well
        pois_radius (int): Radius in meters to search for points of interest around the route.
        amenities (str): Types of amenities to search for, separated by '|'. For example, "restaurant|cafe|bar|hotel".
        limit (int): Maximum number of POIs to return.
        task (str): The task to perform, either "location_only" - if lat long of start and end location is needed,
            else by default is "route_and_pois" - if route and POIs are needed.
    Returns:
        dict: location or route and POIs or both"""
    # Start/end go positionally; the remaining options are forwarded by keyword.
    return generate_map(
        request.start_location,
        request.end_location,
        pois_radius=request.pois_radius,
        amenities=request.amenities,
        limit=request.limit,
        task=request.task,
    )

@app.post('/check-response', operation_id="get_response_check")
async def check_response(request: ResearchCheckRequest):
    """
    Ask the LLM whether the information gathered so far is enough to answer the user's query.
    Any missing aspects are expected to come back as a bulleted list.

    Args:
        query (str): The user's original query.
        toolsshorthand (str): Exact facts/information, in bullets, collected from every past
            tool usage that would be useful for the answer.
    Returns:
        str: Suggestions for improvement or confirmation that all aspects are addressed.
    """
    # The whole instruction, including the query and the collected notes, is sent as a
    # single prompt string.
    review_prompt = f"""You are a professional researcher.
Review the following user query and the agent's short hand of informations collected.
If not explicitly asked for deep research, you should just check if most necessary information and all aspects present in query are covered, NO NEED TO SUGGEST EXTRA, SINCE ITS QUICK QUERY
Determine if the shorthand fully addresses every aspect and intent of the query.
If any part is missing or could be improved, list the specific aspects or suggestions for further research or value addition.(IF DEEP RESEARCH ASKED EXPLICITLY)
If the response is complete, state that all aspects have been addressed.

User Query: {request.query}
Agent Shorthand: {request.toolsshorthand}
"""

    verdict = await llm.ainvoke(review_prompt)
    # Only the text content of the model reply is returned to the caller.
    return verdict.content

@app.post('/text-to-podcast', operation_id="get_podcast")
async def podcaster(request: PodcastRequest):
    """
    Generate a multi-speaker podcast script with the LLM and render it to a .wav file.

    The LLM is asked for a script in ``[Person1] ... [Person2] ...`` form; the script is
    handed to ``parse_podcast`` together with a list of voice names, and the resulting
    segments are passed to ``podcasting`` which writes the audio file.

    Args:
        prompt: The theme or topic of the podcast episode. You can even provide length
            instructions, like shorter/longer duration, tone, etc.
        text: The detailed content over which the podcast is to be made.
    Returns:
        FileResponse: The generated podcast .wav file.
        str: A message with the stored file path if the file response cannot be built.
        dict: ``{"error": ...}`` if creating the audio file fails.
    """
    system_prompt = f"""You are an experienced podcaster who can create engaging episodes on any topic.
Your style makes complex concepts simple, clear, and enjoyable to listen to.

When writing scripts:

Use natural, conversational language.

Avoid special characters (like *, #, etc.) and TTS markup (such as <prosody> tags).

Do not include background descriptions or stage directions.

Always stay on the provided theme (if one is given). If no theme is provided, use the given text to generate engaging, informative content.

The podcast script should be formatted as follows:

<podcast>
[Person1] What Person1 says [Person2] What Person2 says ...
</podcast>


Where each [Person] represents a speaker, followed by their dialogue.

Theme: {request.prompt}
Text: {request.text}
"""

    result = await llm.ainvoke(
        system_prompt
    )
    # Voice names made available to parse_podcast for the speakers in the script.
    voice_choices = ["af_heart","am_michael","am_adam","am_eric","am_echo","am_puck",
                     "am_fenrir","am_santa","am_liam","af_river"
                     ]
    podcast_segments = await parse_podcast(result.content, voice_choices)

    try:
        # exist_ok=True avoids the check-then-create race between concurrent requests.
        os.makedirs("output/podcasts", exist_ok=True)
        file_path = f"output/podcasts/podcast_{str(uuid4())[:8]}.wav"
        await podcasting(podcast_segments, filename=file_path)
        logger.info(f"Current working directory: {os.getcwd()}")

        logger.info(f"Podcast file created at: {file_path}")
        try:
            return FileResponse(
                file_path,
                media_type="audio/wav",
                filename=os.path.basename(file_path)
            )
        except Exception:
            # Best-effort fallback: the audio exists on disk, so report where it is.
            # `Exception` (not a bare except) lets KeyboardInterrupt/SystemExit propagate.
            logger.exception("Could not build FileResponse for generated podcast")
            return f"Generated podcast and stored at {file_path}"
    except Exception as e:
        # Keep the error-dict contract for callers, but leave a trace in the logs.
        logger.exception("Error occurred while creating podcast")
        return {"error": f"Error occurred while creating podcast: {e}"}

@app.post('/basic-tts', operation_id="get_basic_tts")
async def basic_tts(request: BasicTTSRequest):
    """Converts input text to speech using the specified voice and language, and returns the generated audio file.
    Args:
        request (BasicTTSRequest): The request object containing the following fields:
            - text (str): The text to be converted to speech.
            - voice (str): The voice to use for speech synthesis.
            - lang (str): The language code for speech synthesis.
            - filename (str, optional): The output filename for the generated audio file.
              When empty, a file named ``output/basic_tts_<8 chars>.wav`` is used.
    Returns:
        FileResponse: The generated audio file in WAV format if successful.
        dict: An error message if text is not provided or if an exception occurs during TTS generation.
    """
    text = request.text
    # Reject empty input first, before any filesystem work is done.
    if not text:
        return {"error": "Text is required for TTS."}

    # NOTE(review): a caller-supplied filename is used verbatim as the output path;
    # consider restricting it to the output directory if requests are untrusted.
    filename = request.filename

    try:
        if not filename:
            # The default path lives under "output/"; make sure that directory exists,
            # as the podcast endpoint does for its own output directory.
            os.makedirs("output", exist_ok=True)
            filename = f"output/basic_tts_{str(uuid4())[:8]}.wav"

        await text_to_speech(text, request.voice, filename, request.lang)
        return FileResponse(
            filename,
            media_type="audio/wav",
            filename=os.path.basename(filename)
        )
    except Exception as e:
        # Keep the error-dict contract for callers, but leave a trace in the logs.
        logger.exception("Error occurred while creating TTS")
        return {"error": f"Error occurred while creating TTS: {e}"}


# Wrap the FastAPI app for MCP, limited to the operation ids listed below.
# Each entry corresponds to the `operation_id` given on a route decorator.
mcp = FastApiMCP(
    app,
    include_operations=[
        "get_web_search",
        "get_web_summarize",
        "get_youtube_search",
        "get_reddit_search",
        "get_map_search",
        "get_git_tree",
        "get_git_search",
        "get_local_folder_tree",
        "get_response_check",
        "get_website_structure",
        "get_podcast",
        "get_basic_tts",
    ],
)
mcp.mount()

# Runs at import time: print the startup banner with the configured host and port.
display_startup_banner(host=HOST_APP, port=PORT_NUM_APP)