---
# CEIEF Project Configuration
# Cultural Education Interaction Enhancement Framework
#
# Copy this file and fill in your actual values:
#   cp config.yaml config.local.yaml
# Then set environment variable: CEIEF_CONFIG=config.local.yaml
# OR copy .env.example to .env and fill in secrets.

# ============================================================
# LLM Configuration
# ============================================================
llm:
  provider: anthropic
  api_key: "${ANTHROPIC_API_KEY}"  # Set via environment variable
  base_url: "${ANTHROPIC_BASE_URL}"  # e.g. https://api.anthropic.com
  model: "claude-sonnet-4-6"  # or claude-3-5-sonnet-20241022
  max_tokens: 2048
  temperature: 0.7
  top_p: 0.9
  timeout: 60  # request timeout, seconds
  retry_attempts: 3
  retry_delay: 2  # seconds between retries
# ============================================================
# Neo4j Knowledge Graph Configuration
# ============================================================
neo4j:
  uri: "${NEO4J_URI}"  # e.g. bolt://localhost:7687
  user: "${NEO4J_USER}"  # e.g. neo4j
  password: "${NEO4J_PASSWORD}"  # Set via environment variable
  database: "neo4j"
  max_connection_pool_size: 50
  connection_timeout: 30  # seconds
# ============================================================
# Knowledge Graph Retrieval Settings
# ============================================================
kg_retrieval:
  # Top-K triples returned per retrieval query
  top_k: 10
  max_triples_per_query: 10
  # Cosine similarity threshold — also used as second-hop trigger boundary
  similarity_metric: "cosine"
  similarity_threshold: 0.60
  # Hop depth: default 1-hop; second-hop expansion fires when
  # mean similarity < second_hop_threshold OR a required context slot is unresolved
  max_hop_depth: 2
  second_hop_threshold: 0.60  # triggers two-hop expansion
  # Sentence encoder for query–triple semantic retrieval
  # Paper setting: BAAI/bge-m3 (multilingual dense retrieval encoder)
  embedding_model: "BAAI/bge-m3"
  use_semantic_search: true
  fallback_to_keyword: true
# ============================================================
# Agent Controller Settings
# ============================================================
agent:
  policy: "rule_based"  # options: rule_based, ml_based, hybrid
  action_selection: "deterministic"  # options: deterministic, stochastic
  state_window_size: 5
  confusion_threshold: 0.4
  exploration_rate: 0.1
  # The seven dialogue-control actions available to the controller
  actions:
    - evidence_expansion
    - role_anchoring
    - perspective_contrast
    - reflective_prompting
    - clarification
    - simplification
    - summary_closure
# ============================================================
# Dialogue Settings
# ============================================================
dialogue:
  max_turns: 20
  session_timeout: 3600  # seconds
  memory_window: 10  # turns kept in context
  language: "zh"
  role_profiles:
    - museum_guide
    - cultural_teacher
    - historical_interpreter
    - value_mediator
# ============================================================
# Experiment Settings
# ============================================================
experiment:
  conditions:
    - llm_only
    - kg_llm
    - llm_agent
    - full_ceief
  repetitions_per_condition: 20
  task_families:
    - historical_explanation
    - event_interpretation
    - norm_comparison
    - value_conflict_mediation
    - contemporary_transfer
  random_seed: 42
  output_dir: "logs/"
  # tasks_per_family × number of task families = total tasks
  tasks_per_family: 4  # 4 tasks per task family
  total_tasks: 20  # 5 families × 4 tasks
# ============================================================
# Run Policy (Experiment Execution Settings)
# ============================================================
run_policy:
  n_runs_per_condition: 20  # independent runs per experimental condition
  random_seed: 42  # fixed seed for reproducibility
  batch_size: 1  # one dialogue episode per batch
  conditions:
    - llm_only
    - kg_llm
    - llm_agent
    - full_ceief
# ============================================================
# Policy Module (RL Agent Policy Configuration)
# ============================================================
policy_module:
  # 15-dimensional state feature vector (see agent/state_feature_schema.json)
  state_dim: 15
  # Softmax policy over the 7 controller actions
  n_actions: 7
  policy_form: "softmax"  # softmax distribution over action logits
  # Episode-level REINFORCE-style gradient update
  update_rule: "REINFORCE"  # policy gradient; episode-level return
  learning_rate: 1.0e-3  # lr = 1e-3
  discount_factor: 0.99  # γ for discounted return
  baseline: "running_mean"  # variance-reduction baseline
# ============================================================
# Reward Design
# ============================================================
reward_design:
  # Weighted composite reward signal
  # Component weights must sum to 1.0 (0.35 + 0.25 + 0.25 + 0.15 = 1.00)
  components:
    semantic_grounding:
      weight: 0.35
      description: "Degree to which the response is grounded in retrieved KG evidence"
    contextual_coherence:
      weight: 0.25
      description: "Coherence of the response with the preceding dialogue context"
    pedagogical_appropriateness:
      weight: 0.25
      description: "Alignment with culturally appropriate pedagogical strategies"
    role_style_fidelity:
      weight: 0.15
      description: "Consistency with the assigned cultural role and language register"
# ============================================================
# Evaluation Settings
# ============================================================
evaluation:
  auto_metrics:
    - cultural_semantic_coherence
    - kg_coverage_ratio
    - response_depth_score
    - action_diversity_index
  human_metrics:
    - historical_context_matching
    - cultural_label_alignment
    - language_style_modal_alignment
  pre_annotation: true
  inter_rater_reliability: true
# ============================================================
# Human Rating Protocol
# ============================================================
human_rating:
  n_raters: 2  # two trained human raters
  # Raters calibrate on 20% of the material before formal scoring begins
  calibration_proportion: 0.20
  calibration_description: "Rubric calibration on 20% of items before formal scoring"
  # A third rater arbitrates when two primary raters differ by more than 1 point
  arbitration_threshold: 1  # score difference > 1 triggers third-rater arbitration
  arbitration_rule: "third_rater"  # resolution method
  rating_scale:
    min: 1
    max: 5
  # Dimensions scored on the 1–5 scale (mirror evaluation.human_metrics)
  dimensions:
    - historical_context_matching
    - cultural_label_alignment
    - language_style_modal_alignment
# ============================================================
# Logging Settings
# ============================================================
logging:
  level: "INFO"
  log_dir: "logs/"
  dialogue_log: "logs/raw_dialogues/"
  action_log: "logs/controller_actions/"
  retrieval_log: "logs/retrieval_logs/"
  scoring_log: "logs/scoring_outputs/"
  format: "json"
  rotate_size: "100MB"  # rotate log files past this size
# ============================================================
# Paths
# ============================================================
paths:
  data_dir: "data/"
  kg_triples: "data/kg/cultural_triples.csv"
  subgraph_examples: "data/kg/subgraph_examples.json"
  entity_schema: "data/ontology/entity_schema.json"
  relation_schema: "data/ontology/relation_schema.json"
  task_bank: "data/tasks/task_bank.json"
  prompts_dir: "prompts/"
  agent_config: "agent/controller_config.yaml"
  action_space: "agent/action_space.json"