# ================================
# KAG Configuration File
# ================================

# ----------------
# Knowledge Graph Builder
# ----------------
knowledge_graph_builder:
  prompt_dir: ./core/prompts
  doc_type: "screenplay"         # options: screenplay / novel
  max_workers: 32                # maximum number of parallel workers

# ----------------
# Event & Plot Graph Builder
# ----------------
event_plot_graph_builder:
  max_workers: 24
  max_depth: 2                   # maximum distance for node-pair consideration
  check_weakly_connected_components: true   # check weakly connected components when breaking cycles
  min_connected_component_size: 10          # minimum size of weakly connected component
  max_num_triangles: 2000
  max_iterations: 5
  min_confidence: 0.5             # minimum confidence threshold
  event_fallback: [Action, Goal]  # fallback event types

# ----------------
# Schema Probing
# ----------------
probing:
  probing_mode: adjust            # options: fixed / adjust / from_scratch
  refine_background: true
  task_goal: ./core/schema/default_task_goals.txt
  max_workers: 32
  max_retries: 2
  default_graph_schema_path: ./core/schema/default_graph_schema.json
  default_background_path: ./examples/settings/we2_settings.json
  experience_limit: 100
  relation_prune_threshold: 0.01
  entity_prune_threshold: 0.02

# ----------------
# LLM Settings
# ----------------
llm:
  provider: openai
  model_name: Qwen3-235B-A22B-FP8
  api_key: sk-<YOUR_API_KEY>      # replace with your API key
  base_url: http://115.190.15.46:30000/v1
  temperature: 0.0
  max_tokens: 8096
  enable_thinking: true
  timeout: 60

# Alternative LLM config example:
# llm:
#   provider: openai
#   model_name: qwen3-32b
#   api_key: not-needed
#   base_url: http://localhost:8096/v1
#   temperature: 0.0
#   max_tokens: 8096
#   enable_thinking: true
#   timeout: 60

# ----------------
# Graph Embeddings
# ----------------
graph_embedding:
  provider: openai
  model_name: bge-m3
  api_key: not-needed
  base_url: http://localhost:8080/v1
  max_tokens: 8192
  dimensions: 1024
  timeout: 60

# ----------------
# Vector DB Embeddings
# ----------------
vectordb_embedding:
  provider: openai
  model_name: bge-m3
  api_key: not-needed
  base_url: http://localhost:8080/v1
  max_tokens: 8192
  dimensions: 1024
  timeout: 60

# ----------------
# Reranking
# ----------------
rerank:
  provider: cohere
  model_name: Qwen3-Reranker-8B
  api_key: not-needed
  base_url: http://localhost:8012/v1
  timeout: 120

# ----------------
# Document Processing
# ----------------
document_processing:
  chunk_size: 500                 # chunk size (characters or tokens)
  chunk_overlap: 0                # overlap between chunks
  max_workers: 32
  max_segments: 3
  max_content_size: 2000

# ----------------
# Agent Settings
# ----------------
agent:
  max_workers: 32
  score_threshold: 7
  max_retries: 2
  async_timeout: 600
  async_max_attempts: 3
  async_backoff_seconds: 60

# ----------------
# Memory
# ----------------
memory:
  enabled: true
  memory_type: vector
  max_token_limit: 4000
  memory_path: ./data/memory
  history_memory_size: 3
  insight_memory_size: 10

# ----------------
# Storage
# ----------------
storage:
  # Graph database (Neo4j)
  neo4j_uri: bolt://localhost:7687
  neo4j_username: neo4j
  neo4j_password: <YOUR_PASSWORD>
  
  # Vector database
  vector_store_type: chroma
  vector_store_path: data/vector_store

  # Knowledge graph outputs
  knowledge_graph_path: data/knowledge_graph
  
  # Event & plot graph outputs
  event_plot_graph_path: data/event_plot_graph

  # Schema storage
  graph_schema_path: data/graph_schema

  # Relational database (SQL)
  sql_database_path: data/sql
