tgm-team · shenyangHuang · Dec 23, 2025 · Dec 23, 2025 · Dec 23, 2025 · Dec 23, 2025
diff --git a/examples/llm/TGTalker.py b/examples/llm/TGTalker.py
@@ -0,0 +1,196 @@
+import argparse
+import json
+import logging
+
+import numpy as np
+import outlines
+import torch
+from pydantic import BaseModel
+from tgb.linkproppred.evaluate import Evaluator
+from tgtalker_utils import make_system_prompt, make_user_prompt
+from tqdm import tqdm
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+from tgm import DGraph
+from tgm.constants import METRIC_TGB_LINKPROPPRED, RECIPE_TGB_LINK_PRED
+from tgm.data import DGData, DGDataLoader
+from tgm.hooks import RecencyNeighborHook, RecipeRegistry
+from tgm.util.logging import enable_logging, log_metric
+from tgm.util.seed import seed_everything
+
+# Setup logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+
+def predict_link(query_dst: torch.Tensor, llm_dst: int) -> torch.Tensor:
+    return (query_dst == llm_dst).float()
+
+
+class Step(BaseModel):
+    explanation: str
+    output: str
+
+
+class TGAnswer(BaseModel):
+    destination_node: int
+
+
+def main():
+    parser = argparse.ArgumentParser(description='TGTalker LinkPropPred Example')
+    parser.add_argument('--seed', type=int, default=42, help='random seed')
+    parser.add_argument('--dataset', type=str, default='tgbl-wiki', help='Dataset name')
+    parser.add_argument(
+        '--bsize', type=int, default=200, help='batch size (default 200 for TGB)'
+    )
+    parser.add_argument('--device', type=str, default='cuda', help='torch device')
+    parser.add_argument(
+        '--model',
+        type=str,
+        default='Qwen/Qwen3-1.7B',
+        help='Full huggingface model path',
+    )
+    parser.add_argument(
+        '--n-nbrs', type=int, default=10, help='num sampled nbrs (recency)'
+    )
+    parser.add_argument('--log-file-path', type=str, default=None)
+
+    args = parser.parse_args()
+    enable_logging(log_file_path=args.log_file_path)
+    seed_everything(args.seed)
+
+    logger.info(f'Loading dataset {args.dataset}...')
+    train_data, val_data, test_data = DGData.from_tgb(args.dataset).split()
+    logger.info('Initializing Graphs...')
+    train_dg = DGraph(train_data)
+    val_dg = DGraph(val_data)
+    test_dg = DGraph(test_data)
+
+    # set up neighbor hook
+    max_node_id = max(train_dg.num_nodes, val_dg.num_nodes, test_dg.num_nodes)
+    nbr_hook = RecencyNeighborHook(
+        num_nbrs=[args.n_nbrs],  # One hop
+        num_nodes=max_node_id + 1,
+        seed_nodes_keys=['src'],  # We only care about src history for the prompt
+        seed_times_keys=['time'],
+    )
+    hm = RecipeRegistry.build(
+        RECIPE_TGB_LINK_PRED, dataset_name=args.dataset, train_dg=train_dg
+    )
+    hm.register_shared(nbr_hook)
+    train_key, val_key, test_key = hm.keys
+
+    # Prepare Model
+    logger.info(f'Loading Model {args.model}...')
+    try:
+        model = AutoModelForCausalLM.from_pretrained(args.model).to(args.device)
+        tokenizer = AutoTokenizer.from_pretrained(args.model)
+        model = outlines.from_transformers(model, tokenizer)
+
+    except Exception as e:
+        logger.error(f'Failed to load model: {e}')
+        return
+
+    evaluator = Evaluator(name=args.dataset)
+    perf_list = []
+
+    train_loader = DGDataLoader(
+        train_dg, batch_size=200, hook_manager=hm
+    )  # Larger batch for fast warmup
+    val_loader = DGDataLoader(val_dg, batch_size=200, hook_manager=hm)
+
+    with hm.activate(train_key):
+        for batch in train_loader:
+            pass  # Hook automatically updates state
+
+    with hm.activate(val_key):
+        for batch in val_loader:
+            pass
+    logger.info('Registered Train/Val data into Recency neighbor sampler hook')
+
+    # start TGTalker Inference
+    test_loader = DGDataLoader(test_dg, batch_size=args.bsize, hook_manager=hm)
+
+    logger.info('Starting Inference on Test set...')
+
+    count = 0
+    with hm.activate(test_key):
+        for batch in tqdm(test_loader, desc='Test Inference'):
+            # batch.nids[0] keys: 'src', 'dst', 'neg' usually if link pred
+            # src nodes: batch.src
+            # times: batch.times[0] (seed times)
+
+            # The nbr_hook should have populated batch with neighbors.
+            # batch.nbr_nids -> List[Tensor]. batch.nbr_nids[0] for first hop.
+            # shape: [batch_size, num_nbrs]
+
+            srcs = batch.src.cpu().numpy()
+            times = batch.times[0].cpu().numpy()
+
+            if hasattr(batch, 'nbr_nids') and len(batch.nbr_nids) > 0:
+                nbr_nids_batch = batch.nbr_nids[0].cpu().numpy()
+                nbr_times_batch = batch.nbr_times[0].cpu().numpy()
+            else:
+                raise ValueError('Neighbor hook did not populate batch with neighbors')
+
+            # Iterate through batch
+            for i in range(len(srcs)):
+                src = srcs[i]
+                ts = times[i]
+                current_nbr_nids = nbr_nids_batch[i]
+                current_nbr_times = nbr_times_batch[i]
+
+                system_prompt = make_system_prompt()
+                print(src)
+                print(ts)
+                print(current_nbr_nids)
+                print(current_nbr_times)
+                quit()
+                user_prompt = make_user_prompt(
+                    src, ts, current_nbr_nids, current_nbr_times
+                )
+
+                # Construct full prompt for Chat model
+                messages = [
+                    {'role': 'system', 'content': system_prompt},
+                    {'role': 'user', 'content': user_prompt},
+                ]
+                # Apply chat template
+                prompt = tokenizer.apply_chat_template(
+                    messages, tokenize=False, add_generation_prompt=True
+                )
+
+                output = model(
+                    prompt,
+                    TGAnswer,
+                )
+
+                try:
+                    data = json.loads(output)
+                    pred_dst = int(data['destination_node'])
+                    query_dst = torch.cat(
+                        [batch.dst[i].unsqueeze(0), batch.neg_batch_list[i]]
+                    )
+                    y_pred = predict_link(query_dst, pred_dst)
+
+                    input_dict = {
+                        'y_pred_pos': y_pred[0],
+                        'y_pred_neg': y_pred[1:],
+                        'eval_metric': [METRIC_TGB_LINKPROPPRED],
+                    }
+                    perf_list.append(
+                        evaluator.eval(input_dict)[METRIC_TGB_LINKPROPPRED]
+                    )
+                except Exception as e:
+                    logger.error(f'Generation failed: {e}')
+                    logger.info('Generation failed as output: ' + output)
+                    perf_list.append(0.0)
+                count += 1
+
+    score = np.mean(perf_list)
+    logger.info(f'Test Score (MRR): {score}')
+    log_metric('MRR', score)
+
+
+if __name__ == '__main__':
+    main()
diff --git a/examples/llm/test_tgtalker.py b/examples/llm/test_tgtalker.py
@@ -0,0 +1,25 @@
+import pytest
+import torch
+from tgtalker_utils import make_system_prompt, make_user_prompt
+
+
+def test_make_system_prompt():
+    system_prompt = make_system_prompt()
+    assert system_prompt is not None and len(system_prompt) > 0
+
+
+def test_make_user_prompt():
+    src = 1
+    ts = 200
+    user_prompt = make_user_prompt(src, ts)
+    assert user_prompt is not None and len(user_prompt) > 0
+
+
+def test_bad_arg_user_prompt():
+    src = torch.IntTensor([0, 1, 2, 3])
+    ts = torch.IntTensor([5, 5])
+    with pytest.raises(ValueError):
+        make_user_prompt(src, ts)
+
+    with pytest.raises(ValueError):
+        make_user_prompt(None, None)
diff --git a/examples/llm/tgtalker_utils.py b/examples/llm/tgtalker_utils.py
@@ -0,0 +1,34 @@
+from tgm.constants import PADDED_NODE_ID
+
+
+def make_user_prompt(src: int, ts: int, nbr_nids=None, nbr_times=None):
+    if src is None or ts is None:
+        raise ValueError('Source node and timestamp must be provided')
+
+    if not isinstance(src, int) or not isinstance(ts, int):
+        raise ValueError('Source node and timestamp must be integers')
+
+    if nbr_nids is not None and len(nbr_nids) > 0:
+        user_prompt = f',Source Node` {src} has the following past interactions:\n'
+        # Filter out padded nodes
+        valid_indices = [i for i, n in enumerate(nbr_nids) if n != PADDED_NODE_ID]
+
+        for idx in valid_indices:
+            dst = int(nbr_nids[idx])
+            timestamp = int(nbr_times[idx])
+            user_prompt += f'{src}, {dst}, {timestamp}) \n'
+
+        user_prompt += f'Please predict the most likely `Destination Node` for `Source Node` {src} at `Timestamp` {ts}.'
+    else:
+        user_prompt = (
+            f'Predict the next interaction for source node {src} at time {ts},'
+        )
+    return user_prompt
+
+
+def make_system_prompt():
+    system_prompt = (
+        f'You are an expert temporal graph learning agent. Your task is to predict the next interaction (i.e. Destination Node) given the `Source Node` and `Timestamp`.\n\n'
+        f'Description of the temporal graph is provided below, where each line is a tuple of (`Source Node`, `Destination Node`, `Timestamp`).\n\nTEMPORAL GRAPH:\n'
+    )
+    return system_prompt
diff --git a/pyproject.toml b/pyproject.toml
@@ -22,6 +22,10 @@ analytics = [
     "scipy>=1.15.2",
     "tqdm>=4.67.1",
 ]
+llm = [
+    "outlines>=1.2.9",
+    "transformers>=4.36.2",
+]
 dev = [
     "isort>=5.13.2",
     "mypy>=1.13.0",