├── README.md ├── edge_list_short.txt ├── hetero-intro.ipynb ├── hetero-attention.ipynb ├── basics-of-graphs.ipynb └── GCN_hetero.ipynb /README.md: -------------------------------------------------------------------------------- 1 | # graphs 2 | This is the repo for the post "deep learning on graphs" 3 | -------------------------------------------------------------------------------- /edge_list_short.txt: -------------------------------------------------------------------------------- 1 | 0 1 2 | 0 2 3 | 1 2 4 | 1 3 5 | 1 4 6 | 2 4 7 | 2 0 8 | 2 1 9 | 3 4 10 | 3 1 11 | 4 3 12 | 4 0 -------------------------------------------------------------------------------- /hetero-intro.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "### introduction to Heterogenous Graphs\n", 8 | "this note book provide the details of the heterograph of the acm dataset that is discussed in the blog." 9 | ] 10 | }, 11 | { 12 | "cell_type": "code", 13 | "execution_count": 77, 14 | "metadata": {}, 15 | "outputs": [], 16 | "source": [ 17 | "%matplotlib inline\n", 18 | "import dgl\n", 19 | "import numpy as np\n", 20 | "import scipy.sparse as sp\n", 21 | "# Creating from networkx graph\n", 22 | "import networkx as nx\n", 23 | "import scipy.io\n", 24 | "import urllib.request\n" 25 | ] 26 | }, 27 | { 28 | "cell_type": "code", 29 | "execution_count": 2, 30 | "metadata": {}, 31 | "outputs": [ 32 | { 33 | "name": "stdout", 34 | "output_type": "stream", 35 | "text": [ 36 | "['__header__', '__version__', '__globals__', 'TvsP', 'PvsA', 'PvsV', 'AvsF', 'VvsC', 'PvsL', 'PvsC', 'A', 'C', 'F', 'L', 'P', 'T', 'V', 'PvsT', 'CNormPvsA', 'RNormPvsA', 'CNormPvsC', 'RNormPvsC', 'CNormPvsT', 'RNormPvsT', 'CNormPvsV', 'RNormPvsV', 'CNormVvsC', 'RNormVvsC', 'CNormAvsF', 'RNormAvsF', 'CNormPvsL', 'RNormPvsL', 'stopwords', 'nPvsT', 'nT', 'CNormnPvsT', 'RNormnPvsT', 'nnPvsT', 'nnT', 'CNormnnPvsT', 'RNormnnPvsT', 'PvsP', 'CNormPvsP', 'RNormPvsP']\n" 37 | ] 38 | } 39 | ], 40 | "source": [ 41 | "data_url = 'https://data.dgl.ai/dataset/ACM.mat'\n", 42 | "data_file_path = 'ACM.mat'\n", 43 | "\n", 44 | "urllib.request.urlretrieve(data_url, data_file_path)\n", 45 | "data = scipy.io.loadmat(data_file_path)\n", 46 | "print(list(data.keys()))" 47 | ] 48 | }, 49 | { 50 | "cell_type": "code", 51 | "execution_count": 78, 52 | "metadata": {}, 53 | "outputs": [ 54 | { 55 | "data": { 56 | "text/plain": [ 57 | "Graph(num_nodes={'author': 17431, 'paper': 12499, 'subject': 73},\n", 58 | " num_edges={('paper', 'written-by', 'author'): 37055, ('author', 'writing', 'paper'): 37055, ('paper', 'citing', 'paper'): 30789, ('paper', 'cited', 'paper'): 30789, ('paper', 'is-about', 'subject'): 12499, ('subject', 'has', 'paper'): 12499},\n", 59 | " metagraph=[('author', 'paper'), ('paper', 'author'), ('paper', 'paper'), ('paper', 'paper'), ('paper', 'subject'), ('subject', 'paper')])" 60 | ] 61 | }, 62 | "execution_count": 78, 63 | "metadata": {}, 64 | "output_type": "execute_result" 65 | } 66 | ], 67 | "source": [ 68 | "G = dgl.heterograph({\n", 69 | " ('paper', 'written-by', 'author') : data['PvsA'],\n", 70 | " ('author', 'writing', 'paper') : data['PvsA'].transpose(),\n", 71 | " ('paper', 'citing', 'paper') : data['PvsP'],\n", 72 | " ('paper', 'cited', 'paper') : data['PvsP'].transpose(),\n", 73 | " ('paper', 'is-about', 'subject') : data['PvsL'],\n", 74 | " ('subject', 'has', 'paper') : data['PvsL'].transpose(),\n", 75 | " })\n", 76 | "G" 77 | ] 78 | }, 79 | { 80 | "cell_type": "code", 81 | "execution_count": 11, 82 | "metadata": {}, 83 | "outputs": [ 84 | { 85 | "data": { 86 | "text/plain": [ 87 | "['author', 'paper', 'subject']" 88 | ] 89 | }, 90 | "execution_count": 11, 91 | "metadata": {}, 92 | "output_type": "execute_result" 93 | } 94 | ], 95 | "source": [ 96 | "G.ntypes" 97 | ] 98 | }, 99 | { 100 | "cell_type": "code", 101 | "execution_count": 17, 102 | "metadata": {}, 103 | "outputs": [ 104 | { 105 | "data": { 106 | "text/plain": [ 107 | "tensor([ 0, 1, 2, ..., 17428, 17429, 17430])" 108 | ] 109 | }, 110 | "execution_count": 17, 111 | "metadata": {}, 112 | "output_type": "execute_result" 113 | } 114 | ], 115 | "source": [ 116 | "G.nodes('author')" 117 | ] 118 | }, 119 | { 120 | "cell_type": "code", 121 | "execution_count": 112, 122 | "metadata": {}, 123 | "outputs": [], 124 | "source": [ 125 | "def author(number):\n", 126 | " return data['A'][number][0][0]\n", 127 | "def find_author_by_name(name):\n", 128 | " for i in range(17430):\n", 129 | " if author(i).find(name) >= 0:\n", 130 | " print(i, author(i))" 131 | ] 132 | }, 133 | { 134 | "cell_type": "code", 135 | "execution_count": 113, 136 | "metadata": {}, 137 | "outputs": [ 138 | { 139 | "name": "stdout", 140 | "output_type": "stream", 141 | "text": [ 142 | "5100 Jack J. Dongarra\n" 143 | ] 144 | } 145 | ], 146 | "source": [ 147 | "find_author_by_name(\"Dongarra\")" 148 | ] 149 | }, 150 | { 151 | "cell_type": "code", 152 | "execution_count": 104, 153 | "metadata": {}, 154 | "outputs": [], 155 | "source": [ 156 | "def institution(number):\n", 157 | " return data['F'][number][0][0]\n", 158 | "def find_institution_by_name(name):\n", 159 | " for i in range(len(data['F'])):\n", 160 | " if institution(i).find(name) >= 0:\n", 161 | " print(i, institution(i))" 162 | ] 163 | }, 164 | { 165 | "cell_type": "code", 166 | "execution_count": 115, 167 | "metadata": {}, 168 | "outputs": [], 169 | "source": [ 170 | "def subject(number):\n", 171 | " return data['L'][number][0][0]" 172 | ] 173 | }, 174 | { 175 | "cell_type": "code", 176 | "execution_count": 105, 177 | "metadata": {}, 178 | "outputs": [ 179 | { 180 | "name": "stdout", 181 | "output_type": "stream", 182 | "text": [ 183 | "231 Indiana University\n", 184 | "232 Indiana University Purdue University Indianapolis\n" 185 | ] 186 | } 187 | ], 188 | "source": [ 189 | "find_institution_by_name(\"Indiana\")" 190 | ] 191 | }, 192 | { 193 | "cell_type": "code", 194 | "execution_count": 107, 195 | "metadata": {}, 196 | "outputs": [ 197 | { 198 | "name": "stdout", 199 | "output_type": "stream", 200 | "text": [ 201 | "5100 Jack J. Dongarra\n" 202 | ] 203 | } 204 | ], 205 | "source": [] 206 | }, 207 | { 208 | "cell_type": "code", 209 | "execution_count": 108, 210 | "metadata": {}, 211 | "outputs": [ 212 | { 213 | "name": "stdout", 214 | "output_type": "stream", 215 | "text": [ 216 | "6313 David S. Wise\n", 217 | "9342 Charles Wiseman\n", 218 | "11618 G. Bowden Wise\n" 219 | ] 220 | } 221 | ], 222 | "source": [ 223 | "find_author_by_name(\"Wise\")" 224 | ] 225 | }, 226 | { 227 | "cell_type": "code", 228 | "execution_count": 35, 229 | "metadata": {}, 230 | "outputs": [ 231 | { 232 | "data": { 233 | "text/plain": [ 234 | "Graph(num_nodes={'author': 17431, 'paper': 12499},\n", 235 | " num_edges={('author', 'writing', 'paper'): 37055},\n", 236 | " metagraph=[('author', 'paper')])" 237 | ] 238 | }, 239 | "execution_count": 35, 240 | "metadata": {}, 241 | "output_type": "execute_result" 242 | } 243 | ], 244 | "source": [ 245 | "G['writing']" 246 | ] 247 | }, 248 | { 249 | "cell_type": "code", 250 | "execution_count": 57, 251 | "metadata": {}, 252 | "outputs": [ 253 | { 254 | "data": { 255 | "text/plain": [ 256 | "(tensor([5100]), tensor([9626]))" 257 | ] 258 | }, 259 | "execution_count": 57, 260 | "metadata": {}, 261 | "output_type": "execute_result" 262 | } 263 | ], 264 | "source": [ 265 | "G['writing'].out_edges(5100)" 266 | ] 267 | }, 268 | { 269 | "cell_type": "code", 270 | "execution_count": 58, 271 | "metadata": {}, 272 | "outputs": [ 273 | { 274 | "data": { 275 | "text/plain": [ 276 | "array([array([\"'Bi-objective scheduling algorithms for optimizing makespan and reliability on heterogeneous systems We tackle the problem of scheduling task graphs onto a heterogeneous set of machines, where each processor has a probability of failure governed by an exponential law. The goal is to design algorithms that optimize both makespan and reliability. First, we provide an optimal scheduling algorithm for independent unitary tasks where the objective is to maximize the reliability subject to makespan minimization. For the bi-criteria case, we provide an algorithm that approximates the Pareto-curve. Next, for independent non-unitary tasks, we show that the product { failure rate }x { unitary instruction execution time } is crucial to distinguish processors in this context. Based on these results we are able to let the user choose a trade-off between reliability maximization and makespan minimization. For general task graphs we provide a method for converting scheduling heuristics on heterogeneous cluster into heuristics that take reliability into account. Here again, we show how we can help the user to select a trade-off between makespan and reliability. '\"],\n", 277 | " dtype='\n", 512 | "\n", 525 | "\n", 526 | " \n", 527 | " \n", 528 | " \n", 529 | " \n", 530 | " \n", 531 | " \n", 532 | " \n", 533 | " \n", 534 | " \n", 535 | " \n", 536 | " \n", 537 | " \n", 538 | " \n", 539 | " \n", 540 | " \n", 541 | " \n", 542 | " \n", 543 | " \n", 544 | " \n", 545 | " \n", 546 | " \n", 547 | " \n", 548 | " \n", 549 | " \n", 550 | " \n", 551 | " \n", 552 | " \n", 553 | " \n", 554 | " \n", 555 | " \n", 556 | " \n", 557 | " \n", 558 | " \n", 559 | " \n", 560 | " \n", 561 | " \n", 562 | " \n", 563 | " \n", 564 | " \n", 565 | "
0123
sosp80.02.016.02.0
soda0.096.02.01.0
sigcom7.04.086.02.0
vldb0.01.02.097.0
\n", 566 | "" 567 | ], 568 | "text/plain": [ 569 | " 0 1 2 3\n", 570 | "sosp 80.0 2.0 16.0 2.0\n", 571 | "soda 0.0 96.0 2.0 1.0\n", 572 | "sigcom 7.0 4.0 86.0 2.0\n", 573 | "vldb 0.0 1.0 2.0 97.0" 574 | ] 575 | }, 576 | "execution_count": 46, 577 | "metadata": {}, 578 | "output_type": "execute_result" 579 | } 580 | ], 581 | "source": [ 582 | "import pandas as pd\n", 583 | "df = pd.DataFrame(mat, index =['sosp', 'soda', 'sigcom','vldb'])\n", 584 | "df" 585 | ] 586 | }, 587 | { 588 | "cell_type": "code", 589 | "execution_count": null, 590 | "metadata": {}, 591 | "outputs": [], 592 | "source": [] 593 | } 594 | ], 595 | "metadata": { 596 | "kernelspec": { 597 | "display_name": "Python 3", 598 | "language": "python", 599 | "name": "python3" 600 | }, 601 | "language_info": { 602 | "codemirror_mode": { 603 | "name": "ipython", 604 | "version": 3 605 | }, 606 | "file_extension": ".py", 607 | "mimetype": "text/x-python", 608 | "name": "python", 609 | "nbconvert_exporter": "python", 610 | "pygments_lexer": "ipython3", 611 | "version": "3.7.4" 612 | } 613 | }, 614 | "nbformat": 4, 615 | "nbformat_minor": 2 616 | } 617 | -------------------------------------------------------------------------------- /basics-of-graphs.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": 2, 6 | "metadata": {}, 7 | "outputs": [ 8 | { 9 | "name": "stderr", 10 | "output_type": "stream", 11 | "text": [ 12 | "Using backend: pytorch\n" 13 | ] 14 | } 15 | ], 16 | "source": [ 17 | "import dgl\n", 18 | "import dgl.function as fn\n", 19 | "import torch as th\n", 20 | "import torch.nn as nn\n", 21 | "import torch.nn.functional as F\n", 22 | "from dgl import DGLGraph\n", 23 | "import numpy as np\n", 24 | "import networkx as nx\n", 25 | "#from res.plot_lib import set_default\n", 26 | "import matplotlib.pyplot as plt\n", 27 | "%matplotlib inline\n", 28 | "from gensim.models import Word2Vec\n", 29 | "import random\n" 30 | ] 31 | }, 32 | { 33 | "cell_type": "raw", 34 | "metadata": {}, 35 | "source": [ 36 | "contents of the file \"edge_list_short.txt\"\n", 37 | "0 1\n", 38 | "0 2\n", 39 | "1 2\n", 40 | "1 3\n", 41 | "1 4\n", 42 | "2 4\n", 43 | "2 0\n", 44 | "2 1\n", 45 | "3 4\n", 46 | "3 1\n", 47 | "4 3\n", 48 | "4 0" 49 | ] 50 | }, 51 | { 52 | "cell_type": "code", 53 | "execution_count": 20, 54 | "metadata": {}, 55 | "outputs": [ 56 | { 57 | "data": { 58 | "image/png": "\n", 59 | "text/plain": [ 60 | "
" 61 | ] 62 | }, 63 | "metadata": {}, 64 | "output_type": "display_data" 65 | } 66 | ], 67 | "source": [ 68 | "G = nx.read_edgelist('edge_list_short.txt', nodetype=int, create_using=nx.DiGraph())\n", 69 | "labels = {0:'0', 1:'1', 2:'2', 3:'3', 4:'4'}\n", 70 | "nx.draw(G, labels=labels)" 71 | ] 72 | }, 73 | { 74 | "cell_type": "code", 75 | "execution_count": 21, 76 | "metadata": {}, 77 | "outputs": [ 78 | { 79 | "data": { 80 | "text/plain": [ 81 | "" 82 | ] 83 | }, 84 | "execution_count": 21, 85 | "metadata": {}, 86 | "output_type": "execute_result" 87 | } 88 | ], 89 | "source": [ 90 | "G" 91 | ] 92 | }, 93 | { 94 | "cell_type": "code", 95 | "execution_count": 22, 96 | "metadata": {}, 97 | "outputs": [ 98 | { 99 | "data": { 100 | "text/plain": [ 101 | "[3, 4, 0]" 102 | ] 103 | }, 104 | "execution_count": 22, 105 | "metadata": {}, 106 | "output_type": "execute_result" 107 | } 108 | ], 109 | "source": [ 110 | "nx.shortest_path(G, 3, 0)" 111 | ] 112 | }, 113 | { 114 | "cell_type": "code", 115 | "execution_count": 23, 116 | "metadata": {}, 117 | "outputs": [ 118 | { 119 | "name": "stdout", 120 | "output_type": "stream", 121 | "text": [ 122 | "[0, 2, 1, 4]\n", 123 | "[0, 2, 1, 3, 4]\n", 124 | "[0, 2]\n", 125 | "[0, 2, 4]\n", 126 | "[0, 1, 4]\n", 127 | "[0, 1, 3, 4]\n", 128 | "[0, 1, 2]\n", 129 | "[0, 1, 2, 4]\n", 130 | "[1, 4, 3]\n", 131 | "[1, 3]\n", 132 | "[1, 2]\n", 133 | "[1, 2, 4, 3]\n", 134 | "[3, 4]\n" 135 | ] 136 | } 137 | ], 138 | "source": [ 139 | "for cycle in nx.simple_cycles(G):\n", 140 | " print(cycle)" 141 | ] 142 | }, 143 | { 144 | "cell_type": "code", 145 | "execution_count": 24, 146 | "metadata": {}, 147 | "outputs": [ 148 | { 149 | "data": { 150 | "text/plain": [ 151 | "[2, 3, 4]" 152 | ] 153 | }, 154 | "execution_count": 24, 155 | "metadata": {}, 156 | "output_type": "execute_result" 157 | } 158 | ], 159 | "source": [ 160 | "list(G.neighbors(1))" 161 | ] 162 | }, 163 | { 164 | "cell_type": "code", 165 | "execution_count": 31, 166 | "metadata": {}, 167 | "outputs": [ 168 | { 169 | "data": { 170 | "text/plain": [ 171 | "OutEdgeView([(0, 1), (0, 2), (1, 2), (1, 3), (1, 4), (2, 4), (2, 0), (2, 1), (3, 4), (3, 1), (4, 3), (4, 0)])" 172 | ] 173 | }, 174 | "execution_count": 31, 175 | "metadata": {}, 176 | "output_type": "execute_result" 177 | } 178 | ], 179 | "source": [ 180 | "G.edges()" 181 | ] 182 | }, 183 | { 184 | "cell_type": "code", 185 | "execution_count": 8, 186 | "metadata": {}, 187 | "outputs": [], 188 | "source": [ 189 | "c = 0\n", 190 | "for edge in G.edges():\n", 191 | " G[edge[0]][edge[1]]['weight'] = c\n", 192 | " c = c+1\n" 193 | ] 194 | }, 195 | { 196 | "cell_type": "code", 197 | "execution_count": 9, 198 | "metadata": {}, 199 | "outputs": [], 200 | "source": [ 201 | "for i in range(5):\n", 202 | " G.nodes[i]['value'] = 3.14+i" 203 | ] 204 | }, 205 | { 206 | "cell_type": "code", 207 | "execution_count": 16, 208 | "metadata": {}, 209 | "outputs": [], 210 | "source": [ 211 | "dG = dgl.DGLGraph()\n", 212 | "dG.from_networkx(G, node_attrs=['value'], edge_attrs=['weight'])" 213 | ] 214 | }, 215 | { 216 | "cell_type": "code", 217 | "execution_count": 17, 218 | "metadata": {}, 219 | "outputs": [ 220 | { 221 | "data": { 222 | "text/plain": [ 223 | "DGLGraph(num_nodes=5, num_edges=12,\n", 224 | " ndata_schemes={'value': Scheme(shape=(), dtype=torch.float32)}\n", 225 | " edata_schemes={'weight': Scheme(shape=(), dtype=torch.int64)})" 226 | ] 227 | }, 228 | "execution_count": 17, 229 | "metadata": {}, 230 | "output_type": "execute_result" 231 | } 232 | ], 233 | "source": [ 234 | "dG" 235 | ] 236 | }, 237 | { 238 | "cell_type": "code", 239 | "execution_count": 18, 240 | "metadata": {}, 241 | "outputs": [ 242 | { 243 | "data": { 244 | "text/plain": [ 245 | "tensor([ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11])" 246 | ] 247 | }, 248 | "execution_count": 18, 249 | "metadata": {}, 250 | "output_type": "execute_result" 251 | } 252 | ], 253 | "source": [ 254 | "dG.edata['weight']" 255 | ] 256 | }, 257 | { 258 | "cell_type": "code", 259 | "execution_count": 19, 260 | "metadata": {}, 261 | "outputs": [ 262 | { 263 | "data": { 264 | "text/plain": [ 265 | "tensor([3.1400, 4.1400, 5.1400, 6.1400, 7.1400])" 266 | ] 267 | }, 268 | "execution_count": 19, 269 | "metadata": {}, 270 | "output_type": "execute_result" 271 | } 272 | ], 273 | "source": [ 274 | "dG.ndata['value']" 275 | ] 276 | }, 277 | { 278 | "cell_type": "code", 279 | "execution_count": 33, 280 | "metadata": {}, 281 | "outputs": [ 282 | { 283 | "data": { 284 | "text/plain": [ 285 | "tensor([2, 3, 3, 2, 2])" 286 | ] 287 | }, 288 | "execution_count": 33, 289 | "metadata": {}, 290 | "output_type": "execute_result" 291 | } 292 | ], 293 | "source": [ 294 | "dG.out_degrees()" 295 | ] 296 | }, 297 | { 298 | "cell_type": "code", 299 | "execution_count": 45, 300 | "metadata": {}, 301 | "outputs": [ 302 | { 303 | "data": { 304 | "text/plain": [ 305 | "tensor([2, 3, 2, 2, 3])" 306 | ] 307 | }, 308 | "execution_count": 45, 309 | "metadata": {}, 310 | "output_type": "execute_result" 311 | } 312 | ], 313 | "source": [ 314 | "dG.in_degrees()" 315 | ] 316 | }, 317 | { 318 | "cell_type": "code", 319 | "execution_count": 65, 320 | "metadata": {}, 321 | "outputs": [], 322 | "source": [ 323 | "dG.ndata['one'] = th.torch.ones(5)\n", 324 | "dG.ndata['deg'] = dG.in_degrees().float()" 325 | ] 326 | }, 327 | { 328 | "cell_type": "code", 329 | "execution_count": 66, 330 | "metadata": {}, 331 | "outputs": [ 332 | { 333 | "data": { 334 | "text/plain": [ 335 | "tensor([2., 3., 2., 2., 3.])" 336 | ] 337 | }, 338 | "execution_count": 66, 339 | "metadata": {}, 340 | "output_type": "execute_result" 341 | } 342 | ], 343 | "source": [ 344 | "dG.ndata['deg']" 345 | ] 346 | }, 347 | { 348 | "cell_type": "code", 349 | "execution_count": 83, 350 | "metadata": {}, 351 | "outputs": [], 352 | "source": [ 353 | "def message_func(edges):\n", 354 | " return {'x' : 2*edges.src['one'] }\n", 355 | "\n", 356 | "def reduce_func(nodes):\n", 357 | " tot = th.torch.sum(nodes.mailbox['x'], dim=1)\n", 358 | " tot = tot+nodes.data['deg']\n", 359 | " return {'tot' : tot}" 360 | ] 361 | }, 362 | { 363 | "cell_type": "code", 364 | "execution_count": 84, 365 | "metadata": {}, 366 | "outputs": [], 367 | "source": [ 368 | "dG.register_message_func(message_func)\n", 369 | "dG.register_reduce_func(reduce_func)" 370 | ] 371 | }, 372 | { 373 | "cell_type": "code", 374 | "execution_count": 85, 375 | "metadata": {}, 376 | "outputs": [], 377 | "source": [ 378 | "dG.send(dG.edges())\n", 379 | "dG.recv(dG.nodes())" 380 | ] 381 | }, 382 | { 383 | "cell_type": "code", 384 | "execution_count": 86, 385 | "metadata": {}, 386 | "outputs": [ 387 | { 388 | "data": { 389 | "text/plain": [ 390 | "tensor([6., 9., 6., 6., 9.])" 391 | ] 392 | }, 393 | "execution_count": 86, 394 | "metadata": {}, 395 | "output_type": "execute_result" 396 | } 397 | ], 398 | "source": [ 399 | "dG.ndata['tot']" 400 | ] 401 | }, 402 | { 403 | "cell_type": "code", 404 | "execution_count": 91, 405 | "metadata": {}, 406 | "outputs": [ 407 | { 408 | "name": "stdout", 409 | "output_type": "stream", 410 | "text": [ 411 | "tensor([0., 0., 0., 0., 0.])\n" 412 | ] 413 | } 414 | ], 415 | "source": [ 416 | "dG.ndata['tot'] = th.zeros(5)\n", 417 | "print(dG.ndata['tot'])\n", 418 | "dG.update_all()" 419 | ] 420 | }, 421 | { 422 | "cell_type": "code", 423 | "execution_count": 92, 424 | "metadata": {}, 425 | "outputs": [ 426 | { 427 | "data": { 428 | "text/plain": [ 429 | "tensor([6., 9., 6., 6., 9.])" 430 | ] 431 | }, 432 | "execution_count": 92, 433 | "metadata": {}, 434 | "output_type": "execute_result" 435 | } 436 | ], 437 | "source": [ 438 | "dG.ndata['tot']" 439 | ] 440 | } 441 | ], 442 | "metadata": { 443 | "kernelspec": { 444 | "display_name": "Python 3", 445 | "language": "python", 446 | "name": "python3" 447 | }, 448 | "language_info": { 449 | "codemirror_mode": { 450 | "name": "ipython", 451 | "version": 3 452 | }, 453 | "file_extension": ".py", 454 | "mimetype": "text/x-python", 455 | "name": "python", 456 | "nbconvert_exporter": "python", 457 | "pygments_lexer": "ipython3", 458 | "version": "3.7.4" 459 | } 460 | }, 461 | "nbformat": 4, 462 | "nbformat_minor": 2 463 | } 464 | -------------------------------------------------------------------------------- /GCN_hetero.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "## Graph Convolutional Netoworks and the ACM Heterogenous Graph\n", 8 | "this is a slightly modified version of the notebook from the DGL tutorial\n", 9 | "https://docs.dgl.ai/en/0.4.x/tutorials/hetero/1_basics.html\n" 10 | ] 11 | }, 12 | { 13 | "cell_type": "code", 14 | "execution_count": 1, 15 | "metadata": {}, 16 | "outputs": [], 17 | "source": [ 18 | "%matplotlib inline" 19 | ] 20 | }, 21 | { 22 | "cell_type": "markdown", 23 | "metadata": {}, 24 | "source": [ 25 | "\n", 26 | ".. currentmodule:: dgl\n", 27 | "\n", 28 | "Working with Heterogeneous Graphs\n", 29 | "=================================\n", 30 | "\n", 31 | "**Author**: Quan Gan, `Minjie Wang `_, Mufei Li,\n", 32 | "George Karypis, Zheng Zhang\n", 33 | "\n", 34 | "In this tutorial, you learn about:\n", 35 | "\n", 36 | "* Examples of heterogenous graph data and typical applications.\n", 37 | "\n", 38 | "* Creating and manipulating a heterogenous graph in DGL.\n", 39 | "\n", 40 | "* Implementing `Relational-GCN `_, a popular GNN model,\n", 41 | " for heterogenous graph input.\n", 42 | "\n", 43 | "* Training a model to solve a node classification task.\n", 44 | "\n", 45 | "Heterogeneous graphs, or *heterographs* for short, are graphs that contain\n", 46 | "different types of nodes and edges. The different types of nodes and edges tend\n", 47 | "to have different types of attributes that are designed to capture the\n", 48 | "characteristics of each node and edge type. Within the context of\n", 49 | "graph neural networks, depending on their complexity, certain node and edge types\n", 50 | "might need to be modeled with representations that have a different number of dimensions.\n", 51 | "\n", 52 | "DGL supports graph neural network computations on such heterogeneous graphs, by\n", 53 | "using the heterograph class and its associated API.\n" 54 | ] 55 | }, 56 | { 57 | "cell_type": "markdown", 58 | "metadata": {}, 59 | "source": [ 60 | "Examples of heterographs\n", 61 | "-----------------------\n", 62 | "Many graph datasets represent relationships among various types of entities.\n", 63 | "This section provides an overview for several graph use-cases that show such relationships \n", 64 | "and can have their data represented as heterographs.\n", 65 | "\n", 66 | "Citation graph \n", 67 | "~~~~~~~~~~~~~~~\n", 68 | "The Association for Computing Machinery publishes an `ACM dataset `_ that contains two\n", 69 | "million papers, their authors, publication venues, and the other papers\n", 70 | "that were cited. This information can be represented as a heterogeneous graph.\n", 71 | "\n", 72 | "The following diagram shows several entities in the ACM dataset and the relationships among them \n", 73 | "(taken from `Shi et al., 2015 `_).\n", 74 | "\n", 75 | ".. figure:: https://data.dgl.ai/tutorial/hetero/acm-example.png# \n", 76 | "\n", 77 | "This graph has three types of entities that correspond to papers, authors, and publication venues.\n", 78 | "It also contains three types of edges that connect the following:\n", 79 | "\n", 80 | "* Authors with papers corresponding to *written-by* relationships\n", 81 | "\n", 82 | "* Papers with publication venues corresponding to *published-in* relationships\n", 83 | "\n", 84 | "* Papers with other papers corresponding to *cited-by* relationships\n", 85 | "\n", 86 | "\n", 87 | "Recommender systems \n", 88 | "~~~~~~~~~~~~~~~~~~~~ \n", 89 | "The datasets used in recommender systems often contain\n", 90 | "interactions between users and items. For example, the data could include the\n", 91 | "ratings that users have provided to movies. Such interactions can be modeled\n", 92 | "as heterographs.\n", 93 | "\n", 94 | "The nodes in these heterographs will have two types, *users* and *movies*. The edges\n", 95 | "will correspond to the user-movie interactions. Furthermore, if an interaction is\n", 96 | "marked with a rating, then each rating value could correspond to a different edge type.\n", 97 | "The following diagram shows an example of user-item interactions as a heterograph.\n", 98 | "\n", 99 | ".. figure:: https://data.dgl.ai/tutorial/hetero/recsys-example.png\n", 100 | "\n", 101 | "\n", 102 | "Knowledge graph \n", 103 | "~~~~~~~~~~~~~~~~\n", 104 | "Knowledge graphs are inherently heterogenous. For example, in\n", 105 | "Wikidata, Barack Obama (item Q76) is an instance of a human, which could be viewed as\n", 106 | "the entity class, whose spouse (item P26) is Michelle Obama (item Q13133) and\n", 107 | "occupation (item P106) is politician (item Q82955). The relationships are shown in the following.\n", 108 | "diagram.\n", 109 | "\n", 110 | ".. figure:: https://data.dgl.ai/tutorial/hetero/kg-example.png\n", 111 | "\n", 112 | "\n" 113 | ] 114 | }, 115 | { 116 | "cell_type": "markdown", 117 | "metadata": {}, 118 | "source": [ 119 | "Creating a heterograph in DGL\n", 120 | "-----------------------------\n", 121 | "You can create a heterograph in DGL using the :func:`dgl.heterograph` API.\n", 122 | "The argument to :func:`dgl.heterograph` is a dictionary. The keys are tuples\n", 123 | "in the form of ``(srctype, edgetype, dsttype)`` specifying the relation name\n", 124 | "and the two entity types it connects. Such tuples are called *canonical edge\n", 125 | "types*. The values are data to initialize the graph structures, that is, which\n", 126 | "nodes the edges actually connect.\n", 127 | "\n", 128 | "For instance, the following code creates the user-item interactions heterograph shown earlier.\n", 129 | "\n" 130 | ] 131 | }, 132 | { 133 | "cell_type": "code", 134 | "execution_count": 2, 135 | "metadata": {}, 136 | "outputs": [ 137 | { 138 | "name": "stderr", 139 | "output_type": "stream", 140 | "text": [ 141 | "Using backend: pytorch\n" 142 | ] 143 | } 144 | ], 145 | "source": [ 146 | "# Each value of the dictionary is a pair of source and destination arrays.\n", 147 | "# Nodes are integer IDs starting from zero. Nodes IDs of different types have\n", 148 | "# separate countings.\n", 149 | "import dgl\n", 150 | "import numpy as np\n" 151 | ] 152 | }, 153 | { 154 | "cell_type": "markdown", 155 | "metadata": {}, 156 | "source": [ 157 | "DGL supports creating a graph from a variety of data sources. The following\n", 158 | "code creates the same graph as the above.\n", 159 | "\n", 160 | "Creating from scipy matrix\n", 161 | "\n" 162 | ] 163 | }, 164 | { 165 | "cell_type": "code", 166 | "execution_count": 3, 167 | "metadata": {}, 168 | "outputs": [], 169 | "source": [ 170 | "import scipy.sparse as sp\n", 171 | "# Creating from networkx graph\n", 172 | "import networkx as nx\n" 173 | ] 174 | }, 175 | { 176 | "cell_type": "markdown", 177 | "metadata": {}, 178 | "source": [ 179 | "Manipulating heterograph\n", 180 | "------------------------\n", 181 | "You can create a more realistic heterograph using the ACM dataset. To do this, first \n", 182 | "download the dataset as follows:\n", 183 | "\n" 184 | ] 185 | }, 186 | { 187 | "cell_type": "code", 188 | "execution_count": 4, 189 | "metadata": {}, 190 | "outputs": [ 191 | { 192 | "name": "stdout", 193 | "output_type": "stream", 194 | "text": [ 195 | "['__header__', '__version__', '__globals__', 'TvsP', 'PvsA', 'PvsV', 'AvsF', 'VvsC', 'PvsL', 'PvsC', 'A', 'C', 'F', 'L', 'P', 'T', 'V', 'PvsT', 'CNormPvsA', 'RNormPvsA', 'CNormPvsC', 'RNormPvsC', 'CNormPvsT', 'RNormPvsT', 'CNormPvsV', 'RNormPvsV', 'CNormVvsC', 'RNormVvsC', 'CNormAvsF', 'RNormAvsF', 'CNormPvsL', 'RNormPvsL', 'stopwords', 'nPvsT', 'nT', 'CNormnPvsT', 'RNormnPvsT', 'nnPvsT', 'nnT', 'CNormnnPvsT', 'RNormnnPvsT', 'PvsP', 'CNormPvsP', 'RNormPvsP']\n" 196 | ] 197 | } 198 | ], 199 | "source": [ 200 | "import scipy.io\n", 201 | "import urllib.request\n", 202 | "\n", 203 | "data_url = 'https://data.dgl.ai/dataset/ACM.mat'\n", 204 | "data_file_path = 'ACM.mat'\n", 205 | "\n", 206 | "urllib.request.urlretrieve(data_url, data_file_path)\n", 207 | "data = scipy.io.loadmat(data_file_path)\n", 208 | "print(list(data.keys()))" 209 | ] 210 | }, 211 | { 212 | "cell_type": "markdown", 213 | "metadata": {}, 214 | "source": [ 215 | "The dataset stores node information by their types: ``P`` for paper, ``A``\n", 216 | "for author, ``C`` for conference, ``L`` for subject code, and so on. The relationships\n", 217 | "are stored as SciPy sparse matrix under key ``XvsY``, where ``X`` and ``Y``\n", 218 | "could be any of the node type code.\n", 219 | "\n", 220 | "The following code prints out some statistics about the paper-author relationships.\n", 221 | "\n" 222 | ] 223 | }, 224 | { 225 | "cell_type": "code", 226 | "execution_count": 5, 227 | "metadata": {}, 228 | "outputs": [ 229 | { 230 | "name": "stdout", 231 | "output_type": "stream", 232 | "text": [ 233 | "\n", 234 | "#Papers: 12499\n", 235 | "#Authors: 17431\n", 236 | "#Links: 37055\n" 237 | ] 238 | } 239 | ], 240 | "source": [ 241 | "print(type(data['PvsA']))\n", 242 | "print('#Papers:', data['PvsA'].shape[0])\n", 243 | "print('#Authors:', data['PvsA'].shape[1])\n", 244 | "print('#Links:', data['PvsA'].nnz)" 245 | ] 246 | }, 247 | { 248 | "cell_type": "markdown", 249 | "metadata": {}, 250 | "source": [ 251 | "Converting this SciPy matrix to a heterograph in DGL is straightforward.\n", 252 | "\n" 253 | ] 254 | }, 255 | { 256 | "cell_type": "markdown", 257 | "metadata": {}, 258 | "source": [ 259 | "Create a subset of the ACM graph using the paper-author, paper-paper, \n", 260 | "and paper-subject relationships. Meanwhile, also add the reverse\n", 261 | "relationship to prepare for the later sections.\n", 262 | "\n" 263 | ] 264 | }, 265 | { 266 | "cell_type": "code", 267 | "execution_count": 6, 268 | "metadata": {}, 269 | "outputs": [ 270 | { 271 | "data": { 272 | "text/plain": [ 273 | "Graph(num_nodes={'author': 17431, 'paper': 12499, 'subject': 73},\n", 274 | " num_edges={('paper', 'written-by', 'author'): 37055, ('author', 'writing', 'paper'): 37055, ('paper', 'citing', 'paper'): 30789, ('paper', 'cited', 'paper'): 30789, ('paper', 'is-about', 'subject'): 12499, ('subject', 'has', 'paper'): 12499},\n", 275 | " metagraph=[('author', 'paper'), ('paper', 'author'), ('paper', 'paper'), ('paper', 'paper'), ('paper', 'subject'), ('subject', 'paper')])" 276 | ] 277 | }, 278 | "execution_count": 6, 279 | "metadata": {}, 280 | "output_type": "execute_result" 281 | } 282 | ], 283 | "source": [ 284 | "G = dgl.heterograph({\n", 285 | " ('paper', 'written-by', 'author') : data['PvsA'],\n", 286 | " ('author', 'writing', 'paper') : data['PvsA'].transpose(),\n", 287 | " ('paper', 'citing', 'paper') : data['PvsP'],\n", 288 | " ('paper', 'cited', 'paper') : data['PvsP'].transpose(),\n", 289 | " ('paper', 'is-about', 'subject') : data['PvsL'],\n", 290 | " ('subject', 'has', 'paper') : data['PvsL'].transpose(),\n", 291 | " })\n", 292 | "G" 293 | ] 294 | }, 295 | { 296 | "cell_type": "markdown", 297 | "metadata": {}, 298 | "source": [ 299 | "**Metagraph** (or network schema) is a useful summary of a heterograph.\n", 300 | "Serving as a template for a heterograph, it tells how many types of objects\n", 301 | "exist in the network and where the possible links exist.\n", 302 | "\n", 303 | "DGL provides easy access to the metagraph, which could be visualized using\n", 304 | "external tools.\n", 305 | "\n" 306 | ] 307 | }, 308 | { 309 | "cell_type": "code", 310 | "execution_count": 7, 311 | "metadata": {}, 312 | "outputs": [], 313 | "source": [ 314 | "import matplotlib.pyplot as plt\n" 315 | ] 316 | }, 317 | { 318 | "cell_type": "markdown", 319 | "metadata": {}, 320 | "source": [ 321 | "Learning tasks associated with heterographs\n", 322 | "-------------------------------------------\n", 323 | "Some of the typical learning tasks that involve heterographs include:\n", 324 | "\n", 325 | "* *Node classification and regression* to predict the class of each node or\n", 326 | " estimate a value associated with it.\n", 327 | "\n", 328 | "* *Link prediction* to predict if there is an edge of a certain\n", 329 | " type between a pair of nodes, or predict which other nodes a particular\n", 330 | " node is connected with (and optionally the edge types of such connections).\n", 331 | "\n", 332 | "* *Graph classification/regression* to assign an entire\n", 333 | " heterograph into one of the target classes or to estimate a numerical\n", 334 | " value associated with it.\n", 335 | "\n", 336 | "In this tutorial, we designed a simple example for the first task.\n", 337 | "\n", 338 | "A semi-supervised node classification example\n", 339 | "~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~\n", 340 | "Our goal is to predict the publishing conference of a paper using the ACM\n", 341 | "academic graph we just created. To further simplify the task, we only focus\n", 342 | "on papers published in three conferences: *KDD*, *ICML*, and *VLDB*. All\n", 343 | "the other papers are not labeled, making it a semi-supervised setting.\n", 344 | "\n", 345 | "The following code extracts those papers from the raw dataset and prepares \n", 346 | "the training, validation, testing split.\n", 347 | "\n", 348 | "Note: in this version we look at 4 conferences: SOSP, SODA, Sigcom and VLDB." 349 | ] 350 | }, 351 | { 352 | "cell_type": "code", 353 | "execution_count": 83, 354 | "metadata": {}, 355 | "outputs": [], 356 | "source": [ 357 | "import numpy as np\n", 358 | "import torch\n", 359 | "import torch.nn as nn\n", 360 | "import torch.nn.functional as F\n", 361 | "\n", 362 | "pvc = data['PvsC'].tocsr()\n", 363 | "# sosp = 7\n", 364 | "# soda = 5\n", 365 | "# sigcom = 9\n", 366 | "# vldb = 13\n", 367 | "c_selected = [7, 5, 9, 13] \n", 368 | "\n", 369 | "p_selected = pvc[:, c_selected].tocoo()\n", 370 | "# remake 7,5,9,13 labels as 0,1,2,3\n", 371 | "labels = pvc.indices\n", 372 | "labels[labels==0] = 13\n", 373 | "labels[labels==7] = 0\n", 374 | "labels[labels==1] = 13\n", 375 | "labels[labels == 5] = 1\n", 376 | "labels[labels==2] = 13\n", 377 | "labels[labels == 9]= 2\n", 378 | "labels[labels == 3] = 13\n", 379 | "labels[labels == 13] = 3\n", 380 | "labels = torch.tensor(labels).long()\n", 381 | "\n", 382 | "# generate train/val/test split\n", 383 | "pid = p_selected.row\n", 384 | "shuffle = np.random.permutation(pid)\n", 385 | "\n", 386 | "train_idx = torch.tensor(shuffle[0:1400]).long()\n", 387 | "val_idx = torch.tensor(shuffle[1400:1500]).long()\n", 388 | "test_idx = torch.tensor(shuffle[1500:]).long()" 389 | ] 390 | }, 391 | { 392 | "cell_type": "code", 393 | "execution_count": null, 394 | "metadata": {}, 395 | "outputs": [], 396 | "source": [] 397 | }, 398 | { 399 | "cell_type": "code", 400 | "execution_count": 84, 401 | "metadata": {}, 402 | "outputs": [ 403 | { 404 | "name": "stdout", 405 | "output_type": "stream", 406 | "text": [ 407 | "332 662 648\n" 408 | ] 409 | } 410 | ], 411 | "source": [ 412 | "print( len(labels[labels==0]), len(labels[labels==1]), len(labels[labels==2]))" 413 | ] 414 | }, 415 | { 416 | "cell_type": "code", 417 | "execution_count": 85, 418 | "metadata": {}, 419 | "outputs": [ 420 | { 421 | "name": "stdout", 422 | "output_type": "stream", 423 | "text": [ 424 | "1400 719\n" 425 | ] 426 | } 427 | ], 428 | "source": [ 429 | "print(len(train_idx), len(test_idx))" 430 | ] 431 | }, 432 | { 433 | "cell_type": "markdown", 434 | "metadata": {}, 435 | "source": [ 436 | "Relational-GCN on heterograph\n", 437 | "~~~~~~~~~~~~~~~~~~~~~~~~~~~~~\n", 438 | "We use `Relational-GCN `_ to learn the\n", 439 | "representation of nodes in the graph. Its message-passing equation is as\n", 440 | "follows:\n", 441 | "for each message type we will have a fully connected layer of trainable parameters W. Then for \n", 442 | "for each node and \n", 443 | "each edge type we compute\n", 444 | "\n", 445 | "\\begin{align} \\sum_{j\\in\\mathcal{N}_r(i)} W_r^{(l)}h_j^{(l)} \\end{align}\n", 446 | "\n", 447 | "following that sum over each edge type and apply sigma\n", 448 | "\n", 449 | "\\begin{align}h_i^{(l+1)} = \\sigma\\left(\\sum_{r\\in \\mathcal{R}}\n", 450 | " \\sum_{j\\in\\mathcal{N}_r(i)}W_r^{(l)}h_j^{(l)}\\right)\\end{align}\n", 451 | "\n", 452 | "Breaking down the equation, you see that there are two parts in the\n", 453 | "computation.\n", 454 | "\n", 455 | "(i) Message computation and aggregation within each relation $r$\n", 456 | "\n", 457 | "(ii) Reduction that merges the results from multiple relationships\n", 458 | "\n", 459 | "Following this intuition, perform message passing on a heterograph in\n", 460 | "two steps.\n", 461 | "\n", 462 | "(i) Per-edge-type message passing\n", 463 | "\n", 464 | "(ii) Type wise reduction\n", 465 | "\n" 466 | ] 467 | }, 468 | { 469 | "cell_type": "code", 470 | "execution_count": 86, 471 | "metadata": {}, 472 | "outputs": [], 473 | "source": [ 474 | "import dgl.function as fn\n", 475 | "\n", 476 | "class HeteroRGCNLayer(nn.Module):\n", 477 | " def __init__(self, in_size, out_size, etypes):\n", 478 | " super(HeteroRGCNLayer, self).__init__()\n", 479 | " # W_r for each relation\n", 480 | " self.weight = nn.ModuleDict({\n", 481 | " name : nn.Linear(in_size, out_size) for name in etypes\n", 482 | " })\n", 483 | "\n", 484 | " def forward(self, G, feat_dict):\n", 485 | " # The input is a dictionary of node features for each type\n", 486 | " funcs = {}\n", 487 | " for srctype, etype, dsttype in G.canonical_etypes:\n", 488 | " # Compute W_r * h\n", 489 | " Wh = self.weight[etype](feat_dict[srctype])\n", 490 | " # Save it in graph for message passing\n", 491 | " G.nodes[srctype].data['Wh_%s' % etype] = Wh\n", 492 | " # Specify per-relation message passing functions: (message_func, reduce_func).\n", 493 | " # Note that the results are saved to the same destination feature 'h', which\n", 494 | " # hints the type wise reducer for aggregation.\n", 495 | " funcs[etype] = (fn.copy_u('Wh_%s' % etype, 'm'), fn.mean('m', 'h'))\n", 496 | " # Trigger message passing of multiple types.\n", 497 | " # The first argument is the message passing functions for each relation.\n", 498 | " # The second one is the type wise reducer, could be \"sum\", \"max\",\n", 499 | " # \"min\", \"mean\", \"stack\"\n", 500 | " G.multi_update_all(funcs, 'sum')\n", 501 | " # return the updated node feature dictionary\n", 502 | " return {ntype : G.nodes[ntype].data['h'] for ntype in G.ntypes}" 503 | ] 504 | }, 505 | { 506 | "cell_type": "markdown", 507 | "metadata": {}, 508 | "source": [ 509 | "Create a simple GNN by stacking two ``HeteroRGCNLayer``. Since the\n", 510 | "nodes do not have input features, make their embeddings trainable.\n", 511 | "\n" 512 | ] 513 | }, 514 | { 515 | "cell_type": "code", 516 | "execution_count": 87, 517 | "metadata": {}, 518 | "outputs": [ 519 | { 520 | "data": { 521 | "text/plain": [ 522 | "[('paper', 'written-by', 'author'),\n", 523 | " ('author', 'writing', 'paper'),\n", 524 | " ('paper', 'citing', 'paper'),\n", 525 | " ('paper', 'cited', 'paper'),\n", 526 | " ('paper', 'is-about', 'subject'),\n", 527 | " ('subject', 'has', 'paper')]" 528 | ] 529 | }, 530 | "execution_count": 87, 531 | "metadata": {}, 532 | "output_type": "execute_result" 533 | } 534 | ], 535 | "source": [ 536 | "G.canonical_etypes" 537 | ] 538 | }, 539 | { 540 | "cell_type": "code", 541 | "execution_count": 88, 542 | "metadata": {}, 543 | "outputs": [ 544 | { 545 | "data": { 546 | "text/plain": [ 547 | "Graph(num_nodes={'author': 17431, 'paper': 12499, 'subject': 73},\n", 548 | " num_edges={('paper', 'written-by', 'author'): 37055, ('author', 'writing', 'paper'): 37055, ('paper', 'citing', 'paper'): 30789, ('paper', 'cited', 'paper'): 30789, ('paper', 'is-about', 'subject'): 12499, ('subject', 'has', 'paper'): 12499},\n", 549 | " metagraph=[('author', 'paper'), ('paper', 'author'), ('paper', 'paper'), ('paper', 'paper'), ('paper', 'subject'), ('subject', 'paper')])" 550 | ] 551 | }, 552 | "execution_count": 88, 553 | "metadata": {}, 554 | "output_type": "execute_result" 555 | } 556 | ], 557 | "source": [ 558 | "G" 559 | ] 560 | }, 561 | { 562 | "cell_type": "code", 563 | "execution_count": 89, 564 | "metadata": {}, 565 | "outputs": [ 566 | { 567 | "data": { 568 | "text/plain": [ 569 | "['author', 'paper', 'subject']" 570 | ] 571 | }, 572 | "execution_count": 89, 573 | "metadata": {}, 574 | "output_type": "execute_result" 575 | } 576 | ], 577 | "source": [ 578 | "G.ntypes" 579 | ] 580 | }, 581 | { 582 | "cell_type": "code", 583 | "execution_count": 90, 584 | "metadata": {}, 585 | "outputs": [ 586 | { 587 | "data": { 588 | "text/plain": [ 589 | "ParameterDict(\n", 590 | " (author): Parameter containing: [torch.FloatTensor of size 17431x10]\n", 591 | " (paper): Parameter containing: [torch.FloatTensor of size 12499x10]\n", 592 | " (subject): Parameter containing: [torch.FloatTensor of size 73x10]\n", 593 | ")" 594 | ] 595 | }, 596 | "execution_count": 90, 597 | "metadata": {}, 598 | "output_type": "execute_result" 599 | } 600 | ], 601 | "source": [ 602 | "embed_dict = {ntype : nn.Parameter(torch.Tensor(G.number_of_nodes(ntype), 10))\n", 603 | " for ntype in G.ntypes}\n", 604 | "for key, embed in embed_dict.items():\n", 605 | " nn.init.xavier_uniform_(embed)\n", 606 | "embed = nn.ParameterDict(embed_dict)\n", 607 | "embed" 608 | ] 609 | }, 610 | { 611 | "cell_type": "code", 612 | "execution_count": 91, 613 | "metadata": {}, 614 | "outputs": [], 615 | "source": [ 616 | "class HeteroRGCN(nn.Module):\n", 617 | " def __init__(self, G, in_size, hidden_size, out_size):\n", 618 | " super(HeteroRGCN, self).__init__()\n", 619 | " # Use trainable node embeddings as featureless inputs.\n", 620 | " embed_dict = {ntype : nn.Parameter(torch.Tensor(G.number_of_nodes(ntype), in_size))\n", 621 | " for ntype in G.ntypes}\n", 622 | " for key, embed in embed_dict.items():\n", 623 | " nn.init.xavier_uniform_(embed)\n", 624 | " self.embed = nn.ParameterDict(embed_dict)\n", 625 | " # create layers\n", 626 | " self.layer1 = HeteroRGCNLayer(in_size, hidden_size, G.etypes)\n", 627 | " self.layer2 = HeteroRGCNLayer(hidden_size, out_size, G.etypes)\n", 628 | "\n", 629 | " def forward(self, G):\n", 630 | " h_dict = self.layer1(G, self.embed)\n", 631 | " h_dict = {k : F.leaky_relu(h) for k, h in h_dict.items()}\n", 632 | " h_dict = self.layer2(G, h_dict)\n", 633 | " # get paper logits\n", 634 | " return h_dict['paper']" 635 | ] 636 | }, 637 | { 638 | "cell_type": "markdown", 639 | "metadata": {}, 640 | "source": [ 641 | "Train and evaluate\n", 642 | "~~~~~~~~~~~~~~~~~~\n", 643 | "Train and evaluate this network.\n", 644 | "\n" 645 | ] 646 | }, 647 | { 648 | "cell_type": "code", 649 | "execution_count": 92, 650 | "metadata": {}, 651 | "outputs": [ 652 | { 653 | "name": "stdout", 654 | "output_type": "stream", 655 | "text": [ 656 | "Loss 1.4772, Train Acc 0.2371, Val Acc 0.2300 (Best 0.2300), Test Acc 0.2281 (Best 0.2281)\n", 657 | "Loss 1.2481, Train Acc 0.6450, Val Acc 0.5300 (Best 0.5300), Test Acc 0.5410 (Best 0.5410)\n", 658 | "Loss 1.0722, Train Acc 0.7607, Val Acc 0.5800 (Best 0.5800), Test Acc 0.6203 (Best 0.6203)\n", 659 | "Loss 0.8221, Train Acc 0.8436, Val Acc 0.7400 (Best 0.7500), Test Acc 0.7955 (Best 0.7747)\n", 660 | "Loss 0.5720, Train Acc 0.8893, Val Acc 0.8100 (Best 0.8100), Test Acc 0.8150 (Best 0.8150)\n", 661 | "Loss 0.3809, Train Acc 0.9586, Val Acc 0.8600 (Best 0.8600), Test Acc 0.8428 (Best 0.8428)\n", 662 | "Loss 0.2482, Train Acc 0.9857, Val Acc 0.8700 (Best 0.8700), Test Acc 0.8707 (Best 0.8554)\n", 663 | "Loss 0.1638, Train Acc 0.9929, Val Acc 0.8500 (Best 0.8700), Test Acc 0.8790 (Best 0.8554)\n", 664 | "Loss 0.1139, Train Acc 0.9950, Val Acc 0.8800 (Best 0.8800), Test Acc 0.8971 (Best 0.8971)\n", 665 | "Loss 0.0848, Train Acc 0.9964, Val Acc 0.8900 (Best 0.8900), Test Acc 0.9068 (Best 0.8985)\n", 666 | "Loss 0.0661, Train Acc 0.9986, Val Acc 0.8900 (Best 0.8900), Test Acc 0.9068 (Best 0.8985)\n", 667 | "Loss 0.0535, Train Acc 0.9993, Val Acc 0.8900 (Best 0.8900), Test Acc 0.8985 (Best 0.8985)\n", 668 | "Loss 0.0450, Train Acc 0.9993, Val Acc 0.8900 (Best 0.8900), Test Acc 0.8985 (Best 0.8985)\n", 669 | "Loss 0.0385, Train Acc 1.0000, Val Acc 0.8800 (Best 0.8900), Test Acc 0.9026 (Best 0.8985)\n", 670 | "Loss 0.0335, Train Acc 1.0000, Val Acc 0.8800 (Best 0.8900), Test Acc 0.8999 (Best 0.8985)\n", 671 | "Loss 0.0298, Train Acc 1.0000, Val Acc 0.8800 (Best 0.8900), Test Acc 0.8887 (Best 0.8985)\n", 672 | "Loss 0.0270, Train Acc 1.0000, Val Acc 0.8600 (Best 0.8900), Test Acc 0.8790 (Best 0.8985)\n", 673 | "Loss 0.0247, Train Acc 1.0000, Val Acc 0.8600 (Best 0.8900), Test Acc 0.8790 (Best 0.8985)\n", 674 | "Loss 0.0230, Train Acc 1.0000, Val Acc 0.8600 (Best 0.8900), Test Acc 0.8748 (Best 0.8985)\n", 675 | "Loss 0.0216, Train Acc 1.0000, Val Acc 0.8600 (Best 0.8900), Test Acc 0.8734 (Best 0.8985)\n" 676 | ] 677 | } 678 | ], 679 | "source": [ 680 | "# Create the model. The output has four logits for four classes.\n", 681 | "model = HeteroRGCN(G, 10, 10, 4)\n", 682 | "\n", 683 | "opt = torch.optim.Adam(model.parameters(), lr=0.01, weight_decay=5e-4)\n", 684 | "\n", 685 | "best_val_acc = 0\n", 686 | "best_test_acc = 0\n", 687 | "\n", 688 | "for epoch in range(100):\n", 689 | " logits = model(G)\n", 690 | " # The loss is computed only for labeled nodes.\n", 691 | " loss = F.cross_entropy(logits[train_idx], labels[train_idx])\n", 692 | "\n", 693 | " pred = logits.argmax(1)\n", 694 | " train_acc = (pred[train_idx] == labels[train_idx]).float().mean()\n", 695 | " val_acc = (pred[val_idx] == labels[val_idx]).float().mean()\n", 696 | " test_acc = (pred[test_idx] == labels[test_idx]).float().mean()\n", 697 | "\n", 698 | " if best_val_acc < val_acc:\n", 699 | " best_val_acc = val_acc\n", 700 | " best_test_acc = test_acc\n", 701 | "\n", 702 | " opt.zero_grad()\n", 703 | " loss.backward()\n", 704 | " opt.step()\n", 705 | "\n", 706 | " if epoch % 5 == 0:\n", 707 | " print('Loss %.4f, Train Acc %.4f, Val Acc %.4f (Best %.4f), Test Acc %.4f (Best %.4f)' % (\n", 708 | " loss.item(),\n", 709 | " train_acc.item(),\n", 710 | " val_acc.item(),\n", 711 | " best_val_acc.item(),\n", 712 | " test_acc.item(),\n", 713 | " best_test_acc.item(),\n", 714 | " ))" 715 | ] 716 | }, 717 | { 718 | "cell_type": "code", 719 | "execution_count": 93, 720 | "metadata": {}, 721 | "outputs": [ 722 | { 723 | "name": "stdout", 724 | "output_type": "stream", 725 | "text": [ 726 | "tensor(0.8707)\n" 727 | ] 728 | } 729 | ], 730 | "source": [ 731 | "logits = model(G)\n", 732 | "pred = logits.argmax(1)\n", 733 | "test_acc = (pred[test_idx] == labels[test_idx]).float().mean()\n", 734 | "print(test_acc)" 735 | ] 736 | }, 737 | { 738 | "cell_type": "code", 739 | "execution_count": 94, 740 | "metadata": {}, 741 | "outputs": [ 742 | { 743 | "name": "stdout", 744 | "output_type": "stream", 745 | "text": [ 746 | "[[array(['KDD'], dtype='\n", 915 | "\n", 928 | "\n", 929 | " \n", 930 | " \n", 931 | " \n", 932 | " \n", 933 | " \n", 934 | " \n", 935 | " \n", 936 | " \n", 937 | " \n", 938 | " \n", 939 | " \n", 940 | " \n", 941 | " \n", 942 | " \n", 943 | " \n", 944 | " \n", 945 | " \n", 946 | " \n", 947 | " \n", 948 | " \n", 949 | " \n", 950 | " \n", 951 | " \n", 952 | " \n", 953 | " \n", 954 | " \n", 955 | " \n", 956 | " \n", 957 | " \n", 958 | " \n", 959 | " \n", 960 | " \n", 961 | " \n", 962 | " \n", 963 | " \n", 964 | " \n", 965 | " \n", 966 | " \n", 967 | " \n", 968 | "
0123
sosp81.02.011.07.0
soda1.096.00.02.0
sigcom4.014.078.05.0
vldb1.09.00.091.0
\n", 969 | "" 970 | ], 971 | "text/plain": [ 972 | " 0 1 2 3\n", 973 | "sosp 81.0 2.0 11.0 7.0\n", 974 | "soda 1.0 96.0 0.0 2.0\n", 975 | "sigcom 4.0 14.0 78.0 5.0\n", 976 | "vldb 1.0 9.0 0.0 91.0" 977 | ] 978 | }, 979 | "execution_count": 101, 980 | "metadata": {}, 981 | "output_type": "execute_result" 982 | } 983 | ], 984 | "source": [ 985 | "import pandas as pd\n", 986 | "df = pd.DataFrame(mat, index =['sosp', 'soda', 'sigcom','vldb'])\n", 987 | "df" 988 | ] 989 | }, 990 | { 991 | "cell_type": "markdown", 992 | "metadata": {}, 993 | "source": [ 994 | "What's next?\n", 995 | "------------\n", 996 | "* Check out our full implementation in PyTorch\n", 997 | " `here `_.\n", 998 | "\n", 999 | "* We also provide the following model examples:\n", 1000 | "\n", 1001 | " * `Graph Convolutional Matrix Completion _`,\n", 1002 | " which we implement in MXNet\n", 1003 | " `here `_.\n", 1004 | "\n", 1005 | " * `Heterogeneous Graph Attention Network `_\n", 1006 | " requires transforming a heterograph into a homogeneous graph according to\n", 1007 | " a given metapath (i.e. a path template consisting of edge types). We\n", 1008 | " provide :func:`dgl.transform.metapath_reachable_graph` to do this. See full\n", 1009 | " implementation\n", 1010 | " `here `_.\n", 1011 | "\n", 1012 | " * `Metapath2vec `_ requires\n", 1013 | " generating random walk paths according to a given metapath. Please\n", 1014 | " refer to the full metapath2vec implementation\n", 1015 | " `here `_.\n", 1016 | "\n", 1017 | "* :doc:`Full heterograph API reference <../../api/python/heterograph>`.\n", 1018 | "\n" 1019 | ] 1020 | }, 1021 | { 1022 | "cell_type": "code", 1023 | "execution_count": null, 1024 | "metadata": {}, 1025 | "outputs": [], 1026 | "source": [] 1027 | } 1028 | ], 1029 | "metadata": { 1030 | "kernelspec": { 1031 | "display_name": "Python 3", 1032 | "language": "python", 1033 | "name": "python3" 1034 | }, 1035 | "language_info": { 1036 | "codemirror_mode": { 1037 | "name": "ipython", 1038 | "version": 3 1039 | }, 1040 | "file_extension": ".py", 1041 | "mimetype": "text/x-python", 1042 | "name": "python", 1043 | "nbconvert_exporter": "python", 1044 | "pygments_lexer": "ipython3", 1045 | "version": "3.7.4" 1046 | } 1047 | }, 1048 | "nbformat": 4, 1049 | "nbformat_minor": 1 1050 | } 1051 | --------------------------------------------------------------------------------