-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcodified_decision_tree.py
More file actions
532 lines (413 loc) · 21.1 KB
/
codified_decision_tree.py
File metadata and controls
532 lines (413 loc) · 21.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
import os
import openai
import re, json, jsonlines, pickle
import numpy as np
import torch
import torch.nn.functional as F
from sentence_transformers import SentenceTransformer
from transformers import AutoTokenizer, AutoModelForCausalLM, AutoModelForSequenceClassification
from collections import defaultdict
from constant import openai_key
from copy import deepcopy
from datasets import load_dataset
from nltk import word_tokenize, sent_tokenize
from collections import Counter, defaultdict
from tqdm import tqdm
from sklearn.cluster import KMeans
from openai import OpenAI
# character = "Kasumi"
# engine = "gpt-4.1"
# discriminator_path = "KomeijiForce/deberta-v3-base-rp-nli"
# surface_embedder_path, generator_embedder_path = "Qwen/Qwen3-Embedding-8B", "Qwen/Qwen3-8B"
# max_depth, threshold_accept, threshold_reject, threshold_filter = 3, 0.8, 0.5, 0.8
# device_id = 1
import argparse
def build_arg_parser():
    """Create the command-line parser for the CDT building script.

    Option groups: character/engine selection, model paths, decision
    thresholds, and CUDA device choice.  Every option has a default, so
    the script also runs with no arguments at all.
    """
    parser = argparse.ArgumentParser(
        description="Run CDT building with configurable model and thresholds"
    )
    # Core model / character settings
    parser.add_argument("--character", type=str, default="Kasumi",
                        help="Target character name")
    parser.add_argument("--engine", type=str, default="gpt-4.1",
                        help="LLM engine name")
    # Model paths
    parser.add_argument("--discriminator_path", type=str,
                        default="KomeijiForce/deberta-v3-base-rp-nli",
                        help="Path or name of discriminator model")
    parser.add_argument("--surface_embedder_path", type=str,
                        default="Qwen/Qwen3-Embedding-8B",
                        help="Embedding model for surface encoding")
    parser.add_argument("--generator_embedder_path", type=str,
                        default="Qwen/Qwen3-8B",
                        help="Embedding / generator backbone model")
    # Control parameters
    parser.add_argument("--max_depth", type=int, default=3,
                        help="Maximum reasoning / recursion depth")
    parser.add_argument("--threshold_accept", type=float, default=0.8,
                        help="Acceptance threshold")
    parser.add_argument("--threshold_reject", type=float, default=0.5,
                        help="Rejection threshold")
    parser.add_argument("--threshold_filter", type=float, default=0.8,
                        help="Filtering threshold")
    # Device
    parser.add_argument("--device_id", type=int, default=1,
                        help="CUDA device id")
    return parser
# ---- Parse CLI arguments and unpack them into module-level configuration ----
args = build_arg_parser().parse_args()
character = args.character
engine = args.engine
discriminator_path = args.discriminator_path
surface_embedder_path = args.surface_embedder_path
generator_embedder_path = args.generator_embedder_path
max_depth = args.max_depth
threshold_accept = args.threshold_accept
threshold_reject = args.threshold_reject
threshold_filter = args.threshold_filter
device_id = args.device_id
# Every model below is pinned to this single CUDA device.
device = torch.device(f"cuda:{device_id}")
# OpenAI credentials come from the local `constant` module.
openai.api_key = openai_key
client = OpenAI(api_key=openai_key)
# Map each "major" character to the franchise ("artifact") it belongs to.
all_characters = json.load(open("all_characters.json"))
character2artifact = {character:artifact for artifact in all_characters for character in all_characters[artifact]["major"]}
band2members = json.load(open("band2members.json"))
# Keep finished tqdm bars on screen (passed as `leave=` throughout).
leave_bar = True
# Surface embedder encodes action text; the causal LM embeds scene context.
# Left padding makes the last position hold the newest real token, which
# generative_encode relies on.
surface_tokenizer = AutoTokenizer.from_pretrained(surface_embedder_path)
generator_tokenizer = AutoTokenizer.from_pretrained(generator_embedder_path)
generator_tokenizer.padding_side = "left"
surface_embedding = SentenceTransformer(surface_embedder_path, device=device, model_kwargs={"torch_dtype": torch.float16})
generator_embedding = AutoModelForCausalLM.from_pretrained(generator_embedder_path, torch_dtype=torch.float16).to(device)
# Sequence classifier used as a yes/no/unknown discriminator.
classifier_tokenizer = AutoTokenizer.from_pretrained(discriminator_path)
classifier = AutoModelForSequenceClassification.from_pretrained(discriminator_path)
classifier = classifier.to(device)
def generate(prompt, engine=engine):
    """Send a single-turn user prompt to the OpenAI Responses API and
    return the raw output text.

    The near-zero temperature makes completions effectively deterministic.
    """
    message = {"role": "user", "content": prompt}
    response = client.responses.create(
        model=engine,
        temperature=1e-8,
        input=[message],
    )
    return response.output_text
def load_ar_pairs(character):
    """Load (scene, action) pairs for *character* and split them in half.

    Per-artifact results are cached in data/title2action_series.<artifact>.json
    so the HuggingFace dataset is downloaded only once.  Returns a dict with
    "train" (first half) and "test" (second half); each entry carries the
    original dataset item plus "scene" (up to 10 preceding actions joined by
    newlines) and "last_character" (the speakers of the previous action).
    """
    artifact = character2artifact[character]
    if not os.path.exists(f"data/title2action_series.{artifact}.json"):
        # Build the cache: group this artifact's dataset rows by title.
        title2action_series = defaultdict(list)
        if artifact not in band2members:
            hf_path = "KomeijiForce/Fine_Grained_Fandom_Benchmark_Action_Sequences"
        else:
            # Band characters come from the conversational benchmark instead.
            hf_path = "KomeijiForce/Bandori_Conversational_Benchmark_Action_Sequences"
        for data in load_dataset(hf_path)["train"]:
            if data["artifact"] == artifact:
                title2action_series[data["title"]].append(data)
        json.dump(title2action_series, open(f"data/title2action_series.{artifact}.json", "w"))
    else:
        title2action_series = json.load(open(f"data/title2action_series.{artifact}.json"))
    all_actions = []
    pairs = []
    last_character = []
    for title in title2action_series:
        action_series = title2action_series[title]
        for item in action_series:
            all_actions.append(item["action"])
            # Normalize single-speaker entries to the list-valued field.
            if "character" in item:
                item["characters"] = [item["character"]]
            if character in item["characters"]:
                # The 10 actions preceding the current one (-11:-1 excludes
                # the action just appended).
                # NOTE(review): all_actions is never reset between titles, so
                # a scene window can span a title boundary — confirm intended.
                scene = "\n".join(all_actions[-1-10:-1])
                pairs.append({**item, "scene": scene, "last_character": last_character})
            # Updated every iteration, so it refers to the previous action.
            last_character = item["characters"]
    return {"train": pairs[:len(pairs)//2], "test": pairs[len(pairs)//2:]}
def generative_encode(texts):
    """Return L2-normalized last-token hidden states of the generator LM
    for *texts*, as a numpy array."""
    batch = generator_tokenizer(texts, return_tensors="pt", padding=True).to(device)
    hidden = generator_embedding(**batch, output_hidden_states=True).hidden_states[-1]
    # Tokenizer uses left padding, so index -1 is the newest real token.
    last_token = hidden[:, -1]
    return F.normalize(last_token, p=2, dim=1).detach().cpu().numpy()
def surface_encode(texts):
    """Return L2-normalized SentenceTransformer embeddings of *texts*
    as a numpy array."""
    vectors = surface_embedding.encode(texts, convert_to_tensor=True)
    normalized = F.normalize(vectors, p=2, dim=1)
    return normalized.detach().cpu().numpy()
def select_cluster_centers(character, pairs, n_in_cluster_case, n_in_cluster_sample, n_max_cluster=8, bs=8):
    """Cluster scene/action pairs and return the pairs nearest each centroid.

    Each pair is embedded as the concatenation of a generative encoding of
    its scene (suffixed with a "Thus, {character} decides to" cue) and a
    surface encoding of its action.  KMeans is run with
    ceil(len(pairs) / n_in_cluster_case) clusters, capped at n_max_cluster,
    and for every centroid the n_in_cluster_sample closest pairs (Euclidean
    distance) are collected.

    Returns a list of clusters, each a list of pair dicts.
    """
    actions = [pair["action"] for pair in pairs]
    scenes = [pair["scene"] for pair in pairs]
    with torch.no_grad():
        document_embeddings = []
        for idx in tqdm(range(0, len(actions), bs), desc="Embedding...", leave=leave_bar):
            scenes_batch = [scene + f"\n\nThus, {character} decides to" for scene in scenes[idx:idx+bs]]
            actions_batch = actions[idx:idx+bs]
            document_embeddings.append(np.concatenate([generative_encode(scenes_batch), surface_encode(actions_batch)], -1))
        document_embeddings = np.concatenate(document_embeddings, 0)
    n_clusters = min(int(np.ceil(document_embeddings.shape[0] / n_in_cluster_case)), n_max_cluster)
    kmeans = KMeans(n_clusters=n_clusters, random_state=42)
    kmeans.fit(document_embeddings)
    # (removed unused local `labels = kmeans.labels_` — clusters are rebuilt
    # from centroid distances below, not from the fit assignments)
    clusters = []
    for centroid in kmeans.cluster_centers_:
        distances = (((document_embeddings - centroid) ** 2).sum(-1)) ** 0.5
        nearest = distances.argsort(-1)[:n_in_cluster_sample]
        clusters.append([pairs[i] for i in nearest])
    return clusters
def check_scene(texts, questions):
    """Answer each (scene, question) pair with the discriminator model.

    Returns a list aligned with the inputs: True for "yes", None for
    "unknown", False for "no" (logit index order is [no, unknown, yes],
    matching the [False, None, True] lookup)."""
    prompts = [
        f"Scene: {text}\n\nQuestion: {question}\n\nDirectly answer only yes/no/unknown."
        for text, question in zip(texts, questions)
    ]
    with torch.no_grad():
        batch = classifier_tokenizer(prompts, return_tensors="pt", padding=True).to(device)
        predictions = classifier(**batch).logits.argmax(-1)
    verdicts = (False, None, True)
    return [verdicts[prediction.item()] for prediction in predictions]
def check_statement_probs(character, actions, statements):
    # Score how well each statement grounds its paired action using the
    # yes/no/unknown discriminator.  Returns the softmax probabilities SUMMED
    # over the whole batch as a length-3 numpy array ordered [no, unknown,
    # yes] (same index order check_scene maps to [False, None, True]) —
    # i.e. unnormalized evidence mass, not a per-item distribution.
    # Callers (validate_hypothesis) accumulate these into counters.
    prompts = [f'''Character: {character}
Action: {action}
Statement: {statement}
Question: Does the statement provide correct grounding, which directly supports the character to take the action?
yes: the action involves direct information from the statement.
no: the action indicates the statement's assertion is not always correctly.
unknown: the action is irrelevant to the statement or the causal relationship cannot be determined
Directly answer only yes/no/unknown.''' for action, statement in zip(actions, statements)]
    with torch.no_grad():
        logits = classifier(**classifier_tokenizer(prompts, return_tensors="pt", padding=True).to(device)).logits
        # Sum over the batch dimension before moving to CPU.
        probs = logits.softmax(-1).sum(0).detach().cpu().numpy()
    return probs
def make_hypothesis(cluster, character, goal_topic, established_statements, gate_path, k=3):
    """Ask the LLM to propose k behavior statements and k scene-trigger questions.

    cluster: scene/action pair dicts from one embedding cluster.
    established_statements / gate_path: statements and gate questions already
        accepted along this tree path, shown so the model proposes new ones.
    Returns (action_hypotheses, scene_check_hypotheses) — two lists of strings
    parsed from the model's fenced Python block.
    """
    action_scene_context = "\n\n".join(["# Scene:\n"+pair["scene"]+"\n# Action:\n"+pair["action"] for pair in cluster])
    # "N/A" placeholders keep the prompt well-formed at the tree root.
    established_statement_verbalized = "\n".join(established_statements) if len(established_statements) > 0 else "N/A"
    gate_path_verbalized = "\n".join(gate_path) if len(gate_path) > 0 else "N/A"
    prompt = f'''# Scene-Action Pairs
{action_scene_context}
# Established Statements
{established_statement_verbalized}
# Already Proposed Common Points
{gate_path_verbalized}
# Task
Your task is to build the grounding logic for an AI system to understand the behavior of {character} (Current topic: "{goal_topic}"), assert the AI system has no prior knowledge of {character}.
To do this, please propose hypotheses for the general behavior logic of {character} based on the given action-scene pairs, complete the task step by step:
1. What's the main feature of {character}'s behavior (Focus on the current topic: "{goal_topic}") shown in the given scene-action pairs, **other than the already established statements**?
2. Summarize {k} potential common points (grounding statements) of the actions taken by {character} in the given scenes about the focused topic: "{goal_topic}", **which is other than the already established statements**.
- The grounding statements should be general, avoiding too specific action descriptions. (except when it's a common skill of the character)
- Consider the grounding statements in a general way.
- The grounding statements should be concise, informative, and general sentences.
- Never be assertive! Always make objective description of the character rather than making assertive causal relations.
3. Summarize {k} potential common points of the given scenes that trigger each behavior, **which should be different from already proposed common points.**
- The question should be simple, not ambiguous, and specific to a subset of scenes rather than always applicable.
- Focus on the **next action** when asking! Don't ask whether certain event is involved, instead ask whether the scene might trigger potential behavior for {character}'s **next action**.
- Directly include "{character}'s next action" in the question!
4. Output the hypothesized scene-action triggers in the following format:
```python
action_hypotheses = [] # A list of syntactically complete statements (always mentioning {character})
scene_check_hypotheses = [] # A list of syntactically complete questions to check the given scene (always mentioning {character})
```
'''
    response = generate(prompt)
    # Extract the first fenced ```python block from the reply.
    # NOTE(review): raises IndexError if the model omits the fence — no retry.
    code_str = re.findall("```python(.*?)```", response, re.DOTALL)[0].strip()
    local_vars = {}
    # SECURITY NOTE: this executes model-generated code verbatim; the design
    # assumes the LLM output is trusted.
    exec(code_str, globals(), local_vars)
    action_hypotheses = local_vars["action_hypotheses"]
    scene_check_hypotheses = local_vars["scene_check_hypotheses"]
    return action_hypotheses, scene_check_hypotheses
def validate_hypothesis(character, pairs, hypothesized_question, hypothesized_action, bs=64):
    """Validate a (gate question, statement) hypothesis against scene/action pairs.

    Pass 1 keeps the pairs whose scene satisfies *hypothesized_question*
    (a None question keeps every pair); irrelevant pairs add 1.0 to
    res["Irrelevant"].  Pass 2 accumulates the discriminator's summed
    no/unknown/yes probability mass for *hypothesized_action* over the
    surviving pairs into res["False"] / res["None"] / res["True"].

    Returns (res, filtered_pairs): the score dict and the kept pairs.
    """
    # Float accumulator: probabilities, not integer counts.
    res = defaultdict(float)
    relevance_all = []
    # Pass 1: batched gate check on the scenes.
    for idx in tqdm(range(0, len(pairs), bs), desc="Filtering Scenes...", leave=leave_bar):
        pairs_batch = pairs[idx:idx+bs]
        if hypothesized_question is None:
            # No gate: every pair is considered relevant.
            relevance_all.extend([True] * len(pairs_batch))
        else:
            scenes = [pair["scene"] for pair in pairs_batch]
            relevance_all.extend(check_scene(scenes, [hypothesized_question] * len(pairs_batch)))
    filtered_pairs = []
    for pair, rel in zip(pairs, relevance_all):
        if rel:
            filtered_pairs.append(pair)
        else:
            res["Irrelevant"] += 1.0
    # Pass 2: batched statement-grounding scores over the kept pairs.
    for idx in tqdm(range(0, len(filtered_pairs), bs), desc="Validating Statements...", leave=leave_bar):
        pairs_batch = filtered_pairs[idx:idx+bs]
        actions = [pair["action"] for pair in pairs_batch]
        score = check_statement_probs(character, actions, [hypothesized_action] * len(pairs_batch))
        res["False"] += score[0]
        res["None"] += score[1]
        res["True"] += score[2]
    return res, filtered_pairs
def summarize_triggers(character, gates, statement_candidates):
    """Compress parallel lists of gate questions and statements to at most 8 pairs.

    With 8 or fewer input pairs, the inputs are returned unchanged (no LLM
    call).  Otherwise the LLM rewrites, merges, and deduplicates them into
    exactly 8 pairs, parsed from its fenced JSON reply.

    Returns (gates, statement_candidates) as parallel lists of strings.
    """
    paired_hypotheses = [{"scene_check_hypothesis": gate, "action_hypothesis": statement_candidate}
                         for gate, statement_candidate in zip(gates, statement_candidates)]
    if len(paired_hypotheses) > 8:
        # FIX: the Goal line previously used "{{character}}", which an f-string
        # renders as the literal text "{character}" instead of the character's
        # name; single braces interpolate it like every other occurrence.
        boost_prompt = f"""
# Task: Summarize & Compress Scene–Action Hypothesis Pairs into Top 8
You are given a list of paired hypotheses. Each pair contains:
- "scene_check_hypothesis": a question about {character}'s next action
- "action_hypothesis": a general behavioral grounding statement about {character}
Input pairs:
{paired_hypotheses}
## Goal
Produce a rewritten, deduplicated, and compressed set of **exactly 8** pairs that capture the **most important** and **most general** behavioral grounding logic for {character}.
Rewriting is allowed and encouraged to increase:
- generality
- coverage across different subsets of scenes
- clarity
- non-assertiveness
## Selection Principles (prioritized)
1. **Coverage**: The 8 pairs should collectively cover the widest range of distinct behavioral patterns and distinct scene triggers.
2. **Centrality**: Prefer pairs that reflect recurring or core behaviors across many scene-action pairs.
3. **Specificity without overfitting**: Keep statements general; only keep a specific skill/ability if it appears repeatedly and broadly.
4. **Non-redundancy**: Each of the 8 pairs must represent a meaningfully different behavior/trigger from the others.
5. **Pair coherence**: The scene_check_hypothesis must plausibly test for the corresponding action_hypothesis (do not mismatch them).
## Dedup & Merge Rules
- You may merge multiple similar input pairs into one rewritten pair.
- If two candidate pairs overlap heavily in either the action or the scene question, combine them into a single more general pair.
- Do not preserve original wording when a clearer/general rewrite is possible.
## Constraints to Preserve
### scene_check_hypothesis
- Must be a **single, simple question**
- Must explicitly contain the exact phrase: "{character}'s next action"
- Must target **scene conditions** that could trigger that next action
- Must be applicable to a **subset** of scenes (not a universal always-true condition)
### action_hypothesis
- Must be a **single, concise sentence**
- Must be **non-assertive** (use “may”, “tends to”, “often appears to”, “is described as”, “is observed as”, etc.)
- Must not invent backstory or assume prior knowledge
## Output Format (JSON only)
Return exactly 8 pairs:
```json
{{
  "top8_pairs": [
    {{
      "scene_check_hypothesis": "...",
      "action_hypothesis": "..."
    }},
    {{
      "scene_check_hypothesis": "...",
      "action_hypothesis": "..."
    }},
    ...
  ]
}}
````
## Quality Checklist (must satisfy)
* Exactly 8 pairs.
* No two action_hypothesis items mean the same thing.
* No two scene_check_hypothesis questions ask the same trigger.
* Each scene_check_hypothesis clearly tests for {character}'s next action.
* Each action_hypothesis is general, grounded, and non-assertive.
"""
        response = generate(boost_prompt)
        # Parse the model's fenced JSON answer.
        paired_hypotheses = json.loads(re.findall("```json(.*?)```", response, re.DOTALL)[0].strip())["top8_pairs"]
        gates = [pair["scene_check_hypothesis"] for pair in paired_hypotheses]
        statement_candidates = [pair["action_hypothesis"] for pair in paired_hypotheses]
    return gates, statement_candidates
class CDT_Node:
    """One node of a Codified Decision Tree (CDT).

    A node carries `statements` that hold unconditionally at this point of
    the tree, plus parallel lists `gates` (scene-check questions) and
    `children` (sub-trees entered when a gate answers yes for a scene).
    """

    def __init__(self, character, goal_topic, pairs, built_statements=None, depth=1,
                 established_statements=None, gate_path=None, max_depth=3,
                 threshold_accept=0.8, threshold_reject=0.5, threshold_filter=0.8):
        """Recursively build the node from scene/action `pairs`.

        built_statements: when given (with pairs=None), creates a leaf that
            simply carries those statements, with no hypothesis search.
        established_statements / gate_path: context accumulated along the
            path from the root, forwarded to hypothesis generation so the
            LLM proposes new material.
        Thresholds: a statement correct on >= threshold_accept of the pairs
            becomes unconditional; gated statements with correctness
            <= threshold_reject are dropped; gates whose relevant fraction
            (broadness) exceeds threshold_filter are discarded as
            near-universal.
        """
        # FIX: mutable default arguments ([] shared across calls) replaced
        # with None sentinels; behavior is unchanged for all callers.
        established_statements = [] if established_statements is None else established_statements
        gate_path = [] if gate_path is None else gate_path
        self.statements = []
        self.gates = []  # gates[i] guards children[i]
        self.children = []
        self.depth = depth
        if built_statements is not None:
            assert pairs is None
            self.statements = built_statements
        elif len(pairs) <= 8 or self.depth > max_depth:
            # Too little data or maximum depth reached: empty leaf.
            pass
        else:
            clusters = select_cluster_centers(character, pairs, n_in_cluster_case=16, n_in_cluster_sample=8, n_max_cluster=8, bs=8)
            statement_candidates, gates = [], []
            for cluster in tqdm(clusters, desc="Making Hypotheses...", leave=leave_bar):
                statement_candidates_cluster, gates_cluster = make_hypothesis(cluster, character, goal_topic, established_statements+self.statements, gate_path)
                statement_candidates.extend(statement_candidates_cluster)
                gates.extend(gates_cluster)
            gates, statement_candidates = summarize_triggers(character, gates, statement_candidates)
            # First pass: statements that hold across (nearly) all pairs
            # become unconditional; the rest remain tied to their gate.
            global_statements, gated_statements = [], []
            remained_gates = []
            for gate, statement_candidate in zip(gates, statement_candidates):
                res, _ = validate_hypothesis(character, pairs, None, statement_candidate)
                correctness = res["True"]/(res["True"]+res["False"]+1e-8)+1e-8
                if correctness >= threshold_accept:
                    global_statements.append(statement_candidate)
                else:
                    gated_statements.append(statement_candidate)
                    remained_gates.append(gate)
            self.statements.extend(global_statements)
            # Second pass: re-validate each gated statement on the pairs its
            # gate keeps, and decide to drop, attach a leaf, or recurse.
            for gate, statement_candidate in zip(remained_gates, gated_statements):
                res, filtered_pairs = validate_hypothesis(character, pairs, gate, statement_candidate)
                correctness = res["True"]/(res["True"]+res["False"]+1e-8)+1e-8
                # Fraction of pairs the gate considers relevant.
                broadness = 1-res["Irrelevant"]/sum(res.values())
                if broadness <= threshold_filter:
                    if correctness <= threshold_reject:
                        # Gate-filtered but still not correct enough: discard.
                        continue
                    elif correctness >= threshold_accept:
                        # Reliable within its subset: attach as a leaf.
                        self.gates.append(gate)
                        self.children.append(CDT_Node(character, goal_topic, None, built_statements=[statement_candidate],
                                                      depth=depth+1, established_statements=established_statements+self.statements,
                                                      gate_path=gate_path+[gate], max_depth=max_depth,
                                                      threshold_accept=threshold_accept, threshold_reject=threshold_reject, threshold_filter=threshold_filter))
                    else:
                        # Ambiguous: recurse on the gate-filtered subset.
                        self.gates.append(gate)
                        self.children.append(CDT_Node(character, goal_topic, filtered_pairs,
                                                      depth=depth+1, established_statements=established_statements+self.statements,
                                                      gate_path=gate_path+[gate], max_depth=max_depth,
                                                      threshold_accept=threshold_accept, threshold_reject=threshold_reject, threshold_filter=threshold_filter))

    def traverse(self, scene):
        """Collect every statement active for *scene*: this node's own plus,
        recursively, those of each child whose gate the scene satisfies."""
        statements = deepcopy(self.statements)
        for gate, child in zip(self.gates, self.children):
            # FIX: check_scene expects parallel LISTS of texts and questions;
            # passing the bare strings zipped them character-by-character and
            # the `if` then tested a non-empty list (always truthy).
            if check_scene([scene], [gate])[0]:
                statements.extend(child.traverse(scene))
        return statements
# ---- Build and persist the CDTs for the target character ----
artifact = character2artifact[character]
artifact_characters = all_characters[artifact]["major"]
other_characters = [_character for _character in artifact_characters if _character != character]
# Trees are induced from the training half of the scene/action pairs only.
pairs = load_ar_pairs(character)["train"]
topic2cdt = {}
rel_topic2cdt = {}
# One tree per intrinsic attribute of the character.
for attribute in ["identity", "personality", "ability", "relationship"]:
    goal_topic = f"{character}'s {attribute}"
    cdt_tree = CDT_Node(character, goal_topic, pairs, max_depth=max_depth, threshold_accept=threshold_accept, threshold_reject=threshold_reject, threshold_filter=threshold_filter)
    topic2cdt[goal_topic] = cdt_tree
# One tree per co-character, restricted to pairs whose preceding action
# involved that character; skipped when fewer than 16 such pairs exist.
for other_character in other_characters:
    goal_topic = f"{character}'s interaction with {other_character}"
    relation_pairs = [data for data in pairs if other_character in data["last_character"]]
    if len(relation_pairs) >= 16:
        cdt_tree = CDT_Node(character, goal_topic, relation_pairs, max_depth=max_depth, threshold_accept=threshold_accept, threshold_reject=threshold_reject, threshold_filter=threshold_filter)
        rel_topic2cdt[goal_topic] = cdt_tree
# Persist both tree sets together for downstream inference.
with open(f"packages/{character}.cdt.v3.1.package.relation.pkl", "wb") as f:
    pickle.dump({"topic2cdt": topic2cdt, "rel_topic2cdt": rel_topic2cdt}, f)