
Commit c7535a0

Merge branch 'master' into models/polynormer
2 parents: 4843c02 + e7050f1

File tree: 19 files changed, +2357 / −84 lines


CHANGELOG.md

Lines changed: 4 additions & 0 deletions
@@ -8,6 +8,10 @@ The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/).
  ### Added

  - Added `Polynormer` model and example ([#9908](https://github.com/pyg-team/pytorch_geometric/pull/9908))
+ - Added support for heterogeneous graphs in `GNNExplainer` ([#10158](https://github.com/pyg-team/pytorch_geometric/pull/10158))
+ - Added Graph Positional and Structural Encoder (GPSE) ([#9018](https://github.com/pyg-team/pytorch_geometric/pull/9018))
+ - Added attract-repel link prediction example ([#10107](https://github.com/pyg-team/pytorch_geometric/pull/10107))
+ - Added `ARLinkPredictor`, implementing Attract-Repel embeddings for link prediction ([#10105](https://github.com/pyg-team/pytorch_geometric/pull/10105))
  - Improved documentation for [cuGraph](https://github.com/rapidsai/cugraph) ([#10083](https://github.com/pyg-team/pytorch_geometric/pull/10083))
  - Added `HashTensor` ([#10072](https://github.com/pyg-team/pytorch_geometric/pull/10072))
  - Added `SGFormer` model and example ([#9904](https://github.com/pyg-team/pytorch_geometric/pull/9904))

examples/README.md

Lines changed: 2 additions & 0 deletions
@@ -7,6 +7,8 @@ A great and simple example to start with is [`gcn.py`](./gcn.py), showing a user
  For a simple link prediction example, see [`link_pred.py`](./link_pred.py).

+ For an improved link prediction approach using Attract-Repel embeddings, which can significantly boost accuracy (up to a 23% improvement in AUC), see [`ar_link_pred.py`](./ar_link_pred.py). This approach is based on [Pseudo-Euclidean Attract-Repel Embeddings for Undirected Graphs](https://arxiv.org/abs/2106.09671).
+
  For examples on [Open Graph Benchmark](https://ogb.stanford.edu/) datasets, see the `ogbn_*.py` examples:

  - [`ogbn_train.py`](./ogbn_train.py) is an example for training a GNN on the large-scale `ogbn-papers100m` dataset (~1.6B edges) or the medium-scale `ogbn-products` dataset (~62M edges).
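Before the full example, the Attract-Repel scoring rule itself is worth stating inline: each node embedding is split into an "attract" half and a "repel" half, and a candidate edge is scored as the attract inner product minus the repel inner product. A minimal sketch on toy tensors (shapes chosen arbitrarily for illustration; this mirrors `ARLinkPredictor.forward` in the new file below):

import torch

z_i = torch.randn(4, 64)  # embeddings of 4 source nodes (illustrative)
z_j = torch.randn(4, 64)  # embeddings of 4 target nodes (illustrative)

d = z_i.size(1) // 2  # first half attracts, second half repels
attract = (z_i[:, :d] * z_j[:, :d]).sum(dim=1)
repel = (z_i[:, d:] * z_j[:, d:]).sum(dim=1)
score = attract - repel  # higher score means the edge is more likely

The repel term lets two nodes with similar embeddings still receive a low edge score, a kind of structure a plain inner product cannot express.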

examples/ar_link_pred.py

Lines changed: 216 additions & 0 deletions
@@ -0,0 +1,216 @@
import argparse
import os.path as osp

import torch
import torch.nn.functional as F

import torch_geometric.transforms as T
from torch_geometric.datasets import Planetoid
from torch_geometric.nn import GCNConv
from torch_geometric.utils import negative_sampling, train_test_split_edges


class GCNEncoder(torch.nn.Module):
    def __init__(self, in_channels, hidden_channels, out_channels):
        super().__init__()
        self.conv1 = GCNConv(in_channels, hidden_channels)
        self.conv2 = GCNConv(hidden_channels, out_channels)

    def forward(self, x, edge_index):
        x = self.conv1(x, edge_index).relu()
        return self.conv2(x, edge_index)


class LinkPredictor(torch.nn.Module):
    def __init__(self, in_channels, hidden_channels):
        super().__init__()
        self.lin1 = torch.nn.Linear(in_channels * 2, hidden_channels)
        self.lin2 = torch.nn.Linear(hidden_channels, 1)

    def forward(self, z_i, z_j):
        x = torch.cat([z_i, z_j], dim=1)
        x = self.lin1(x).relu()
        x = self.lin2(x)
        return x.view(-1)


class ARLinkPredictor(torch.nn.Module):
    def __init__(self, in_channels):
        super().__init__()
        # Split embedding dimensions between attract and repel parts:
        self.attract_dim = in_channels // 2
        self.repel_dim = in_channels - self.attract_dim

    def forward(self, z_i, z_j):
        # Split each embedding into its attract and repel parts:
        z_i_attr = z_i[:, :self.attract_dim]
        z_i_repel = z_i[:, self.attract_dim:]

        z_j_attr = z_j[:, :self.attract_dim]
        z_j_repel = z_j[:, self.attract_dim:]

        # The AR score is the attract inner product minus the repel one:
        attract_score = (z_i_attr * z_j_attr).sum(dim=1)
        repel_score = (z_i_repel * z_j_repel).sum(dim=1)

        return attract_score - repel_score


def train(encoder, predictor, data, optimizer):
    encoder.train()
    predictor.train()

    optimizer.zero_grad()
    z = encoder(data.x, data.train_pos_edge_index)

    # Predict on positive edges:
    pos_out = predictor(z[data.train_pos_edge_index[0]],
                        z[data.train_pos_edge_index[1]])

    # Sample and predict on negative edges:
    neg_edge_index = negative_sampling(
        edge_index=data.train_pos_edge_index,
        num_nodes=data.num_nodes,
        num_neg_samples=data.train_pos_edge_index.size(1),
    )
    neg_out = predictor(z[neg_edge_index[0]], z[neg_edge_index[1]])

    # Binary cross-entropy over positive and negative edges:
    pos_loss = F.binary_cross_entropy_with_logits(pos_out,
                                                  torch.ones_like(pos_out))
    neg_loss = F.binary_cross_entropy_with_logits(neg_out,
                                                  torch.zeros_like(neg_out))
    loss = pos_loss + neg_loss

    loss.backward()
    optimizer.step()

    return loss.item()


@torch.no_grad()
def test(encoder, predictor, data):
    encoder.eval()
    predictor.eval()

    z = encoder(data.x, data.train_pos_edge_index)

    pos_val_out = predictor(z[data.val_pos_edge_index[0]],
                            z[data.val_pos_edge_index[1]])
    neg_val_out = predictor(z[data.val_neg_edge_index[0]],
                            z[data.val_neg_edge_index[1]])

    pos_test_out = predictor(z[data.test_pos_edge_index[0]],
                             z[data.test_pos_edge_index[1]])
    neg_test_out = predictor(z[data.test_neg_edge_index[0]],
                             z[data.test_neg_edge_index[1]])

    val_auc = compute_auc(pos_val_out, neg_val_out)
    test_auc = compute_auc(pos_test_out, neg_test_out)

    return val_auc, test_auc


def compute_auc(pos_out, neg_out):
    from sklearn.metrics import roc_auc_score

    pos_score = torch.sigmoid(pos_out).cpu()
    neg_score = torch.sigmoid(neg_out).cpu()

    y_true = torch.cat(
        [torch.ones(pos_score.size(0)),
         torch.zeros(neg_score.size(0))])
    y_score = torch.cat([pos_score, neg_score])

    return roc_auc_score(y_true.numpy(), y_score.numpy())


def main():
    parser = argparse.ArgumentParser()
    parser.add_argument('--dataset', type=str, default='Cora',
                        choices=['Cora', 'CiteSeer', 'PubMed'])
    parser.add_argument('--hidden_channels', type=int, default=128)
    parser.add_argument('--out_channels', type=int, default=64)
    parser.add_argument('--epochs', type=int, default=200)
    parser.add_argument('--use_ar', action='store_true',
                        help='Use Attract-Repel embeddings')
    parser.add_argument('--lr', type=float, default=0.01)
    args = parser.parse_args()

    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

    # Load the dataset:
    transform = T.Compose([
        T.NormalizeFeatures(),
        T.ToDevice(device),
    ])

    path = osp.join(osp.dirname(osp.realpath(__file__)), '..', 'data',
                    args.dataset)
    dataset = Planetoid(path, args.dataset, transform=transform)
    data = dataset[0]

    # Split edges into train/val/test sets for link prediction:
    data = train_test_split_edges(data)

    encoder = GCNEncoder(
        in_channels=dataset.num_features,
        hidden_channels=args.hidden_channels,
        out_channels=args.out_channels,
    ).to(device)

    # Choose the predictor based on args:
    if args.use_ar:
        predictor = ARLinkPredictor(in_channels=args.out_channels).to(device)
        print(f"Running link prediction on {args.dataset} "
              "with Attract-Repel embeddings")
    else:
        predictor = LinkPredictor(
            in_channels=args.out_channels,
            hidden_channels=args.hidden_channels).to(device)
        print(f"Running link prediction on {args.dataset} "
              "with traditional embeddings")

    optimizer = torch.optim.Adam(
        list(encoder.parameters()) + list(predictor.parameters()), lr=args.lr)

    best_val_auc = 0
    final_test_auc = 0

    for epoch in range(1, args.epochs + 1):
        loss = train(encoder, predictor, data, optimizer)
        val_auc, test_auc = test(encoder, predictor, data)

        if val_auc > best_val_auc:
            best_val_auc = val_auc
            final_test_auc = test_auc

        if epoch % 10 == 0:
            print(f'Epoch: {epoch:03d}, Loss: {loss:.4f}, '
                  f'Val AUC: {val_auc:.4f}, '
                  f'Test AUC: {test_auc:.4f}')

    print(f'Final results - Val AUC: {best_val_auc:.4f}, '
          f'Test AUC: {final_test_auc:.4f}')

    # Report the R-fraction (the share of total embedding norm held by the
    # repel part) when using AR embeddings:
    if args.use_ar:
        with torch.no_grad():
            z = encoder(data.x, data.train_pos_edge_index)
            attr_dim = args.out_channels // 2

            z_attr = z[:, :attr_dim]
            z_repel = z[:, attr_dim:]

            attract_norm_squared = torch.sum(z_attr**2)
            repel_norm_squared = torch.sum(z_repel**2)

            r_fraction = repel_norm_squared / (attract_norm_squared +
                                               repel_norm_squared)
            print(f"R-fraction: {r_fraction.item():.4f}")


if __name__ == '__main__':
    main()
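Assuming the script is saved as `examples/ar_link_pred.py` as above, the two predictors can be compared directly from the command line (a sketch; both flags come from the argument parser in `main()`):

python examples/ar_link_pred.py --dataset Cora           # baseline MLP LinkPredictor
python examples/ar_link_pred.py --dataset Cora --use_ar  # ARLinkPredictor

With `--use_ar`, the script additionally reports the R-fraction, i.e. the share of total embedding norm assigned to the repel half.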

examples/llm/README.md

Lines changed: 9 additions & 9 deletions
@@ -1,11 +1,11 @@
  # Examples for Co-training LLMs and GNNs

Of the nine rewritten table rows, only the `g_retriever.py` description changes in substance: it now notes that the example uses the toy WebQSP dataset and links to an accompanying blog post. The remaining rows are merely re-padded to the new column width. The updated table:

| Example | Description |
| ------- | ----------- |
| [`g_retriever.py`](./g_retriever.py) | Example for Retrieval-Augmented Generation (RAG) w/ GNN+LLM by co-training `LLAMA3` with `GAT` for answering questions based on knowledge graph information from the toy WebQSP dataset. We also have an [example repo](https://github.com/neo4j-product-examples/neo4j-gnn-llm-example) for integration with [Neo4j Graph DBs][neo4j.com], along with an associated [blog](https://developer.nvidia.com/blog/boosting-qa-accuracy-with-graphrag-using-pyg-and-graph-databases/) showing 2x accuracy gains over LLMs on real medical data. |
| [`g_retriever_utils/`](./g_retriever_utils/) | Contains multiple scripts for benchmarking GRetriever's architecture and evaluating different retrieval methods. |
| [`multihop_rag/`](./multihop_rag/) | Contains starter code and an example run for building a Multi-hop dataset using WikiHop5M and 2WikiMultiHopQA. |
| [`nvtx_examples/`](./nvtx_examples/) | Contains examples of how to wrap functions using the NVTX profiler for CUDA runtime analysis. |
| [`molecule_gpt.py`](./molecule_gpt.py) | Example for MoleculeGPT: Instruction Following Large Language Models for Molecular Property Prediction. Supports the MoleculeGPT and InstructMol datasets. |
| [`glem.py`](./glem.py) | Example for [GLEM](https://arxiv.org/abs/2210.14709), a GNN+LLM co-training model via a variational Expectation-Maximization (EM) framework on node classification tasks to achieve SOTA results. |
| [`git_mol.py`](./git_mol.py) | Example for GIT-Mol: A Multi-modal Large Language Model for Molecular Science with Graph, Image, and Text. |

examples/llm/g_retriever.py

Lines changed: 2 additions & 0 deletions
@@ -9,6 +9,8 @@
  Example repo for integration with Neo4j Graph DB:
  https://github.com/neo4j-product-examples/neo4j-gnn-llm-example
+ Example blog showing 2x accuracy over LLM on real medical data:
+ https://developer.nvidia.com/blog/boosting-qa-accuracy-with-graphrag-using-pyg-and-graph-databases/
  """
  import argparse
  import gc

test/contrib/explain/test_pgm_explainer.py

Lines changed: 2 additions & 1 deletion
@@ -5,7 +5,7 @@
  from torch_geometric.explain import Explainer
  from torch_geometric.explain.config import ModelConfig
  from torch_geometric.nn import GCNConv, global_add_pool
- from torch_geometric.testing import withPackage
+ from torch_geometric.testing import minPython, withPackage


  class GCN(torch.nn.Module):

@@ -45,6 +45,7 @@ def forward(self, x, edge_index, edge_weight=None, batch=None, **kwargs):

  edge_label_index = torch.tensor([[0, 1, 2], [3, 4, 5]])


+ @minPython('3.10')
  @withPackage('pgmpy', 'pandas')
  @pytest.mark.parametrize('node_idx', [2, 6])
  @pytest.mark.parametrize('task_level, perturbation_mode', [
