RAG Service

Chat Test

Your primary workspace for testing Flexible Chat and Multimodal interactions with comprehensive testing tools.
API Version: 2.2.1 · Updated: 2025-10-02 · Config: resources/configs/development_config.yml
Launch Unified Test

Service Health Status

Run quick or deep checks to validate config, upstream AOAI, and dependencies.
Disabled
Loading service health…
Last checked: Never

Testing

Test your RAG and Chat endpoints with interactive interfaces and comprehensive validation tools.
Test RAG retrieval, chat conversations, and multimodal capabilities with real-time validation.

Ingestion

Upload documents to build or update your knowledge base. Supports async processing with status tracking.

Documentation

Access API documentation and interactive docs.
Explore endpoints, schemas, and usage examples.

Endpoint Status

Features: Flexible enabled, Multimodal enabled, Feedback enabled

Enabled: health, flexible, experiments, upload, knowledge, functions_health, search_admin, ingestion, doc_center, feedback

Disabled: None

Configuration Snapshot

Pretty-printed configuration (safe view).
Show Config (YAML)
# Root of the configuration snapshot ("safe view": secret values appear as <hidden>).
app:
  name: MyChatApp
  # NOTE(review): marked "production", but the page header loads development_config.yml,
  # the function app host below contains "test", and other.debug is true — confirm the
  # intended environment.
  deployment: production
  function_app_url: https://func-aichat-test-msba.azurewebsites.net
  # HTTP API settings: OpenAPI metadata, routes, server process options, CORS, and feature flags.
  api:
    title: RAG Service
    version: 2.2.1
    description: RAG Service API
    # NOTE(review): contact, terms_of_service, and the production server entry all use
    # example.com placeholders — confirm real values are supplied where this matters.
    contact:
      name: API Support
      email: support@example.com
      url: null
    license:
      name: MIT
      url: https://opensource.org/licenses/MIT
    terms_of_service: https://example.com/terms
    servers:
    - url: http://127.0.0.1:8000
      description: Development server
      variables: null
    - url: https://api.example.com
      description: Production server
      variables: null
    # Documentation and schema paths all sit under the /api prefix.
    docs_url: /api/docs
    openapi_url: /api/openapi.json
    redoc_url: /api/redoc
    prefix: /api
    # Same ten names as the "Enabled" list shown under Endpoint Status.
    enabled_endpoints:
    - health
    - flexible
    - experiments
    - upload
    - knowledge
    - functions_health
    - search_admin
    - ingestion
    - doc_center
    - feedback
    templates_dir: rag_api_core/templates
    static_dir: rag_api_core/static
    static_url: /static
    # NOTE(review): debug is null here while other.debug is true — which one takes
    # effect is not visible in this snapshot.
    debug: null
    host: 0.0.0.0
    port: 8000
    reload: null
    workers: 1
    cors_enabled: true
    # NOTE(review): https://yourdomain.com looks like a placeholder origin — confirm.
    cors_origins:
    - http://localhost:3000
    - http://127.0.0.1:3000
    - https://yourdomain.com
    cors_methods:
    - GET
    - POST
    - PUT
    - DELETE
    cors_headers:
    - Content-Type
    - Authorization
    - X-API-Key
    # 16777216 = 16 * 1024 * 1024; presumably bytes (16 MiB) — TODO confirm the unit.
    max_request_size: 16777216
    # Unit not shown in this snapshot; presumably seconds — TODO confirm.
    timeout: 30
    access_log: true
    log_level: null
    features:
      feedback_collection_enabled: true
      ab_testing_enabled: false
      custom_metrics_enabled: true
    feedback: null
  # Data fetchers keyed by name; each entry names a processor and its parameters.
  fetchers:
    RestAPIFetcher:
      processor: flatten_user_dict
      params:
        # NOTE(review): jsonplaceholder.typicode.com is a public mock API — confirm
        # this is an intentional sample target.
        base_url: https://jsonplaceholder.typicode.com
        token: ''
    AzureSearchFetcher:
      processor: noop
      params:
        # Empty query/filter in the snapshot; presumably supplied per request — verify.
        query: ''
        filter: ''
        top_k: 5
        skip: 0
        include_total_count: true
        # Presumably an Azure AI Search facet expression (facet on `type`, up to 5
        # buckets) — confirm against the consumer.
        facets:
        - type,count:5
        highlight_fields:
        - text
        search_fields:
        - text
        - section_title
        select_fields:
        - id
        - source_file
        - file_type
        - page_number
        - sheet_name
        - table_name
        - chunk_index
        - type
        - text
        - section_title
        - subsection_title
        # semantic and vector_search are both on while hybrid is null.
        # NOTE(review): how a null hybrid flag is interpreted is not visible here.
        semantic: true
        semantic_config: default-semantic
        vector_search: true
        hybrid: null
        # Same field name as vector_field in both ai_search index entries.
        vector_field: contentVector
      # Sibling of params (not nested inside it).
      metadata_fields:
      - source_file
      - page_number
      - type
      - sheet_name
      - table_name
  # Model registry: chat LLM aliases under llms, embedding models under embeddings.
  models:
    llms:
      # Alias to use when none is named; points at the `default` entry below.
      default_alias: default
      models:
        # Azure-hosted chat deployment; the only alias with provider: azure.
        default:
          provider: azure
          deployment: ChatModelLM
          # NOTE(review): this URL is shown in clear while `endpoint` below is masked —
          # confirm it is acceptable in the safe view.
          api_base_url: https://kanev-mf4a5d70-swedencentral.cognitiveservices.azure.com/
          # Quoted so the date-prefixed value is always read as a string, matching the
          # quoted api_version on the embeddings model.
          api_version: '2024-12-01-preview'
          azure_endpoint: null
          use_managed_identity: false
          api_key: <hidden>
          endpoint: <hidden>
          model: gpt-5-chat
          model_name: gpt-5-chat
          # Generation parameters; identical across every alias in this snapshot.
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        # Direct OpenAI alias.
        # NOTE(review): the alias name says gpt4o but `model` is gpt-4o-mini — confirm
        # which is intended.
        oai_gpt4o:
          provider: openai
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          # NOTE(review): managed identity is enabled on a non-Azure provider;
          # presumably ignored — verify.
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          model: gpt-4o-mini
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        # OpenRouter aliases for Anthropic models. The three entries below differ only
        # in `model`.
        # NOTE(review): use_managed_identity is true on each although the provider is
        # openrouter; presumably ignored — verify.
        or_claude:
          provider: openrouter
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          model: anthropic/claude-3.5-sonnet
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        or_claude_opus:
          provider: openrouter
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          model: anthropic/claude-3-opus
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        or_claude_sonnet_4:
          provider: openrouter
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          model: anthropic/claude-sonnet-4
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        # OpenRouter alias for Google's Gemini 2.5 Flash model.
        or_gemini:
          provider: openrouter
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          # NOTE(review): managed identity on a non-Azure provider; presumably ignored — verify.
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          model: google/gemini-2.5-flash
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        # OpenRouter alias for Google's Gemini 2.5 Pro model.
        or_gemini_pro:
          provider: openrouter
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          # NOTE(review): managed identity on a non-Azure provider; presumably ignored — verify.
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          # Previously google/gemini-2.5-flash, which made this alias an exact duplicate
          # of or_gemini; the "pro" alias now targets the Pro model.
          model: google/gemini-2.5-pro
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        # Remaining OpenRouter aliases (OpenAI and Meta models). They share the same
        # params; they differ in `model`, and or_llama alone sets supports_multimodal
        # to false.
        # NOTE(review): use_managed_identity is true on each although the provider is
        # openrouter; presumably ignored — verify.
        or_gpt4o:
          provider: openrouter
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          model: openai/gpt-4o
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        or_gpt5:
          provider: openrouter
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          model: openai/gpt-5-chat
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          supports_multimodal: true
        or_llama:
          provider: openrouter
          deployment: null
          api_base_url: null
          api_version: null
          azure_endpoint: null
          use_managed_identity: true
          api_key: <hidden>
          endpoint: <hidden>
          model: meta-llama/llama-3.1-8b-instruct
          model_name: null
          params:
            max_tokens: 6000
            temperature: 0.2
            top_p: 0.9
            frequency_penalty: 0.0
            presence_penalty: 0.0
            stop: []
            repetition_penalty: null
            n: 1
            stream: false
            logit_bias: null
            reasoning_effort: null
          prompts: null
          # The only alias in this snapshot flagged as not multimodal.
          supports_multimodal: false
      # Fallback LLM settings. Every alias above sets max_tokens to 6000 explicitly,
      # so the 2000 here only matters for an alias that omits it.
      # NOTE(review): how these defaults merge with per-model params is not visible
      # in this snapshot.
      defaults:
        prompts: null
        params:
          max_tokens: 2000
          temperature: null
          top_p: null
          frequency_penalty: null
          presence_penalty: null
          stop: []
          repetition_penalty: null
          n: null
          stream: null
          # Empty mapping here, whereas the per-model params use null.
          logit_bias: {}
          reasoning_effort: null
    # Embedding model registry.
    embeddings:
      # NOTE(review): null here although a `default` model is defined below (llms sets
      # default_alias: default) — confirm the fallback behaviour.
      default_alias: null
      models:
        default:
          endpoint: <hidden>
          vectorizer_base_url: null
          url: null
          deployment: EmbeddingModelADA002
          model_name: text-embedding-ada-002
          # Quoted so the date-shaped value stays a string.
          api_version: '2023-05-15'
          api_key: <hidden>
          use_managed_identity: false
      defaults: null
  # Top-level index is unset; index definitions live under ai_search.indexes.
  index: null
  # Search service settings with two named indexes (private, public).
  ai_search:
    index: null
    indexes:
      # Both entries share vector_dim, field names, and semantic fields; they differ in
      # name and index_yml_path.
      private:
        name: private_text_index
        skillset_name: null
        indexer_name: null
        indexes_path: resources/AI_search_indexes
        index_yml_path: private_text_index.yml
        vector_dim: 1536
        vector_field: contentVector
        index_text_field: text
        filename_field: source_file
        semantic_content_fields:
        - text
        - section_title
        semantic_title_field: section_title
      public:
        name: unified_text_index
        skillset_name: null
        indexer_name: null
        indexes_path: resources/AI_search_indexes
        index_yml_path: text_index.yml
        vector_dim: 1536
        vector_field: contentVector
        index_text_field: text
        filename_field: source_file
        semantic_content_fields:
        - text
        - section_title
        semantic_title_field: section_title
    # Refers to the `public` key under indexes.
    default_index: public
    endpoint: <hidden>
    api_key: <hidden>
    use_managed_identity: false
    # NOTE(review): apart from source_file, these names (video_url, speaker, ...) do not
    # appear in AzureSearchFetcher's select_fields or metadata_fields — confirm they
    # match the deployed index schema.
    metadata_fields:
    - source_file
    - video_url
    - timestamp
    - speaker
    - topic
    - keyword
    - questionoranswer
  # Storage settings. Blob, file share, table, and queue all use the same account name,
  # managed identity, and endpoint suffix.
  storage:
    blob_storage:
      account_name: saaichatdevservicet
      use_managed_identity: true
      endpoint_suffix: core.windows.net
      # Container and directory names for prompt templates, plus default template files.
      prompts_storage:
        container_name: prompts
        directories:
          experiments: experiments
          response_templates: response_templates
          system_prompts: system_prompts
        defaults:
          response_template: default_prompt.j2
          system_prompt: system_prompt.j2
      # Maps a file extension to a directory path; presumably relative to
      # base_container — TODO confirm.
      file_mappings:
        base_container: conversionfiles
        file_type_mappings:
          .pdf: pdf/raw
          .txt: transcripts/raw
          .docx: docs/raw
          .xlsx: data/raw
          .csv: data/raw
          .json: data/raw
          .pptx: presentations/raw
          .mp4: video/raw
          .mp3: audio/raw
          .wav: audio/raw
          .png: images/raw
          .jpg: images/raw
          .jpeg: images/raw
        # Presumably used for extensions not listed above — verify.
        default_directory: other/raw
        case_insensitive: true
    file_share:
      account_name: saaichatdevservicet
      share_name: shared-files
      directory_path: uploads
      use_managed_identity: true
      endpoint_suffix: core.windows.net
    table_storage:
      account_name: saaichatdevservicet
      table_name: ingestion
      use_managed_identity: true
      endpoint_suffix: core.windows.net
    queue_storage:
      account_name: saaichatdevservicet
      queue_name: document-processing
      use_managed_identity: true
      endpoint_suffix: core.windows.net
    default_account_name: saaichatdevservicet
    default_resource_group: DEV-Test-Services
    # NOTE(review): the subscription ID is shown in clear in the safe view — confirm
    # that is acceptable.
    default_subscription_id: 45729ecb-461f-42d8-a1d4-988cbc9f09c8
  # Document analysis service settings (endpoint and key are masked).
  form_recognizer:
    endpoint: <hidden>
    # Quoted so the date-prefixed value is always read as a string, matching the quoted
    # api_version on the embeddings model.
    api_version: '2023-02-28-preview'
    model_id: prebuilt-document
    # Unit/semantics not shown here; presumably pages per analysis request — TODO confirm.
    pages_per_call: 100
    api_key: <hidden>
  secrets_mapping: null
  # A/B experiment definitions. Everything is off in this snapshot: the section flag,
  # the experiment's own flag, status, and traffic_split.
  experiments:
    enabled: false
    experiments:
      prompt_optimization:
        name: System Prompt Optimization
        status: inactive
        traffic_split: 0
        # Two variants with equal weights.
        # NOTE(review): the prompt paths use prompts/recovered_space/, which does not
        # match the prompts_storage directories under storage — confirm they resolve.
        variants:
          control:
            name: Original Prompt
            prompt_path: prompts/recovered_space/system_prompt.j2
            weight: 50
          treatment:
            name: Enhanced Prompt
            prompt_path: prompts/recovered_space/enhanced_system_prompt.j2
            weight: 50
        success_metrics:
        - user_satisfaction
        - response_relevance
        - task_completion
        enabled: false
  # Miscellaneous runtime settings.
  other:
    # NOTE(review): debug is true while app.deployment is "production" and api.debug is
    # null — confirm this is intended.
    debug: true
    log_level: INFO
    telemetry_enabled: null
    environment: null
    custom_setting: null
  # NOTE(review): null although `ingestion` is listed in api.enabled_endpoints — confirm
  # the endpoint works without this section.
  ingestion: null