Merge pull request #6 from jermainewang/doc

Doc

Merge pull request #6 from jermainewang/doc
Doc
4d7b3ba8 · VoVAllen · GitHub · 9628481f · 9e92fe74 · 4d7b3ba8
Unverified Commit 4d7b3ba8 authored Oct 23, 2018 by VoVAllen Committed by GitHub Oct 23, 2018
11 changed files
--- a/README.md
+++ b/README.md
@@ -2,62 +2,6 @@
 [![Build Status](http://216.165.71.225:8080/buildStatus/icon?job=DGL/master)](http://216.165.71.225:8080/job/DGL/job/master/)
 [![GitHub license](https://dmlc.github.io/img/apache2.svg)](./LICENSE)
-## Architecture
-Show below, there are three sets of APIs for different models.
- `update_all`, `proppagate` are more global
- `update_by_edge`, `update_to` and `update_from` give finer control when updates are applied to a path, or a group of nodes
- `sendto` and `recvfrom` are the bottom primitives that update a message and node.
-![Screenshot](graph-api.png)
+For how to install and how to play with DGL, please read our
+[Documentation](http://216.165.71.225:23232/index.html)
-## For Model developers
- Always choose the API at the *highest* possible level.
- Refer to the [GCN example](examples/pytorch/gcn/gcn_batch.py) to see how to register message and node update functions;
-## How to build (the `cpp` branch)
-Before building, make sure that the submodules are cloned.  If you haven't initialized the submodules, run
-```sh
-$ git submodule init
-```
-To sync the submodules, run
-```sh
-$ git submodule update
-```
-### Linux
-At the root directory of the repo:
-```sh
-$ mkdir build
-$ cd build
-$ cmake ..
-$ make
-$ export DGL_LIBRARY_PATH=$PWD
-```
-The `DGL_LIBRARY_PATH` environment variable should point to the library `libdgl.so` built by CMake.
-### Windows/MinGW (Experimental)
-Make sure you have the following installed:
-* CMake
-* MinGW/GCC (G++)
-* MinGW/Make
-You can grab them from Anaconda.
-In the command line prompt, run:
-```
-> md build
-> cd build
-> cmake -DCMAKE_CXX_FLAGS="-DDMLC_LOG_STACK_TRACE=0 -DTVM_EXPORTS" .. -G "MinGW Makefiles"
-> mingw32-make
-> set DGL_LIBRARY_PATH=%CD%
-```
--- a/docs/.gitignore
+++ b/docs/.gitignore
 build
+# tutorials are auto-generated
+tutorials
--- a/docs/README.md
+++ b/docs/README.md
+DGL document and tutorial folder
+================================
+To build,
+```
+make html
+```
+and then render the page `build/html/index.html`.
--- a/docs/source/conf.py
+++ b/docs/source/conf.py
@@ -45,6 +45,7 @@ extensions = [
    'sphinx.ext.mathjax',
    'sphinx.ext.napoleon',
    'sphinx.ext.viewcode',
+    'sphinx_gallery.gen_gallery',
 ]
 # Add any paths that contain templates here, relative to this directory.
@@ -133,7 +134,7 @@ latex_elements = {
 # (source start file, target name, title,
 #  author, documentclass [howto, manual, or own class]).
 latex_documents = [
-    (master_doc, 'dgl.tex', 'dgl Documentation',
+    (master_doc, 'dgl.tex', 'DGL Documentation',
     'DGL Team', 'manual'),
 ]
@@ -143,7 +144,7 @@ latex_documents = [
 # One entry per manual page. List of tuples
 # (source start file, name, description, authors, manual section).
 man_pages = [
-    (master_doc, 'dgl', 'dgl Documentation',
+    (master_doc, 'dgl', 'DGL Documentation',
     [author], 1)
 ]
@@ -154,8 +155,8 @@ man_pages = [
 # (source start file, target name, title, author,
 #  dir menu entry, description, category)
 texinfo_documents = [
-    (master_doc, 'dgl', 'dgl Documentation',
+    (master_doc, 'dgl', 'DGL Documentation',
-     author, 'dgl', 'One line description of project.',
+     author, 'dgl', 'Library for deep learning on graphs.',
     'Miscellaneous'),
 ]
@@ -179,3 +180,13 @@ epub_exclude_files = ['search.html']
 # -- Extension configuration -------------------------------------------------
+# sphinx gallery configurations
+examples_dirs = ['../../tutorials']  # path to find sources
+gallery_dirs = ['tutorials']  # path to generate docs
+sphinx_gallery_conf = {
+    'examples_dirs' : examples_dirs,
+    'gallery_dirs' : gallery_dirs,
+    'filename_pattern' : '.py',
+}
--- a/docs/source/install/index.rst
+++ b/docs/source/install/index.rst
@@ -72,3 +72,23 @@ built above. Use following command to test whether the installation is successfu
 Install from docker
 -------------------
 TBD
+Install on Windows/MinGW
+------------------------
+Make sure you have the following installed:
+* CMake
+* MinGW/GCC (G++)
+* MinGW/Make
+You can grab them from Anaconda.
+In the command line prompt, run:
+.. code:: bash
+    md build
+    cd build
+    cmake -DCMAKE_CXX_FLAGS="-DDMLC_LOG_STACK_TRACE=0 -DTVM_EXPORTS" .. -G "MinGW Makefiles"
+    mingw32-make
+    set DGL_LIBRARY_PATH=%CD%
--- a/docs/source/tutorials/index.rst
+++ b/docs/source/tutorials/index.rst
-Tutorials
-=========
-TBD: Get started on DGL
--- a/graph-api.png
+++ b/graph-api.png
--- a/python/dgl/frame.py
+++ b/python/dgl/frame.py
@@ -251,7 +251,7 @@ class Frame(MutableMapping):
        if self.num_rows == 0:
            raise DGLError('Cannot add column "%s" using column schemes because'
                           ' number of rows is unknown. Make sure there is at least'
-                           ' one column in the frame so number of rows can be inferred.')
+                           ' one column in the frame so number of rows can be inferred.' % name)
        if self.initializer is None:
            dgl_warning('Initializer is not set. Use zero initializer instead.'
                        ' To suppress this warning, use `set_initializer` to'

--- a/tutorials/README.txt
+++ b/tutorials/README.txt
+Tutorials
+=========
+These are some first DGL tutorials you want to read.
--- a/tutorials/first.py
+++ b/tutorials/first.py
+"""
+Your first example in DGL
+=========================
+TODO: either a pagerank or SSSP example
+"""
+###############################################################################
+# Create a DGLGraph
+# -----------------
+#
+# To start with, let's first import dgl
+import dgl
--- a/tutorials/graph.py
+++ b/tutorials/graph.py
+"""
+Use DGLGraph
+============
+In this tutorial, we introduce how to use our graph class -- ``DGLGraph``.
+The ``DGLGraph`` is the very core data structure in our library. It provides the basic
+interfaces to manipulate graph structure, set/get node/edge features and convert
+from/to many other graph formats. You can also perform computation on the graph
+using our message passing APIs. (TODO: give a link here to the message passing doc)
+"""
+###############################################################################
+# Construct a graph
+# -----------------
+# 
+# In ``DGLGraph``, all nodes are represented using consecutive integers starting from
+# zero. All edges are directed. Let us start by creating a star network of 10 nodes
+# where all the edges point to the center node (node#0).
+# TODO(minjie): it's better to plot the graph here.
+import dgl
+star = dgl.DGLGraph()
+star.add_nodes(10)  # add 10 nodes
+for i in range(1, 10):
+    star.add_edge(i, 0)
+print('#Nodes:', star.number_of_nodes())
+print('#Edges:', star.number_of_edges())
+###############################################################################
+# ``DGLGraph`` also supports adding multiple edges at once by providing multiple
+# source and destination nodes. Multiple nodes are represented using either a
+# list or a 1D integer tensor(vector). In addition to this, we also support
+# "edge broadcasting":
+#
+# .. note::
+# 
+#   Given two source and destination node list/tensor ``u`` and ``v``.
+#
+#   - If ``len(u) == len(v)``, then this is a many-many edge set and
+#     each edge is represented by ``(u[i], v[i])``.
+#   - If ``len(u) == 1``, then this is a one-many edge set.
+#   - If ``len(v) == 1``, then this is a many-one edge set.
+#
+# Edge broadcasting is supported in many APIs whenever a bunch of edges need
+# to be specified. The example below creates the same star graph as the previous one.
+star.clear()  # clear the previous graph
+star.add_nodes(10)
+u = list(range(1, 10))  # can also use tensor type here (e.g. torch.Tensor)
+star.add_edges(u, 0)  # many-one edge set
+print('#Nodes:', star.number_of_nodes())
+print('#Edges:', star.number_of_edges())
+###############################################################################
+# In ``DGLGraph``, each edge is assigned an internal edge id (also a consecutive
+# integer starting from zero). The ids follow the addition order of the edges
+# and you can query the id using the ``edge_ids`` interface.
+print(star.edge_ids(1, 0))  # the first edge
+print(star.edge_ids([8, 9], 0))  # ask for ids of multiple edges
+###############################################################################
+# Assigning consecutive integer ids for nodes and edges makes it easier to batch
+# their features together (see next section). As a result, removing nodes or edges
+# of a ``DGLGraph`` is currently not supported because this will break the assumption
+# that the ids form a consecutive range from zero.
+###############################################################################
+# Node and edge features
+# ----------------------
+# Nodes and edges can have feature data in tensor type. They can be accessed/updated
+# through a key-value storage interface. The key must be hashable. The value should
+# be features of each node and edge batched on the *first* dimension. For example,
+# following codes create features for all nodes (``hv``) and features for all
+# edges (``he``). Each feature is a vector of length 3.
+#
+# .. note::
+#
+#   The first dimension is usually reserved as batch dimension in DGL. Thus, even setting
+#   only one node/edge still needs to have an extra dimension (of length one).
+import torch as th
+D = 3  # the feature dimension
+N = star.number_of_nodes()
+M = star.number_of_edges()
+nfeat = th.randn((N, D))  # some random node features
+efeat = th.randn((M, D))  # some random edge features
+# TODO(minjie): enable following syntax
+# star.nodes[:]['hv'] = nfeat
+# star.edges[:]['he'] = efeat
+star.set_n_repr({'hv' : nfeat})
+star.set_e_repr({'he' : efeat})
+###############################################################################
+# We can then set some nodes' features to be zero.
+# TODO(minjie): enable following syntax
+# print(star.nodes[:]['hv'])
+print(star.get_n_repr()['hv'])
+# set node 0, 2, 4 feature to zero
+star.set_n_repr({'hv' : th.zeros((3, D))}, [0, 2, 4])
+print(star.get_n_repr()['hv'])
+###############################################################################
+# Once created, each node/edge feature will be associated with a *scheme* containing
+# the shape, dtype information of the feature tensor. Updating features using data
+# of different scheme will raise error unless all the features are updated,
+# in which case the scheme will be replaced with the new one.
+print(star.node_attr_schemes())
+# updating features with different scheme will raise error
+# star.set_n_repr({'hv' : th.zeros((3, 2*D))}, [0, 2, 4])
+# updating all the nodes is fine, the old scheme will be replaced
+star.set_n_repr({'hv' : th.zeros((N, 2*D))})
+print(star.node_attr_schemes())
+###############################################################################
+# If a new feature is added for some but not all of the nodes/edges, we will
+# automatically create empty features for the others to make sure that features are
+# always aligned. By default, we fill zero for the empty features. The behavior
+# can be changed using ``set_n_initializer`` and ``set_e_initializer``.
+star.set_n_repr({'hv_1' : th.randn((3, D+1))}, [0, 2, 4])
+print(star.node_attr_schemes())
+print(star.get_n_repr()['hv_1'])
+###############################################################################
+# Convert from/to other formats
+# -----------------------------
+# DGLGraph can be easily converted from/to ``networkx`` graph.
+import networkx as nx
+# note that networkx create undirected graph by default, so when converting
+# to DGLGraph, directed edges of both directions will be added.
+nx_star = nx.star_graph(9)
+star = dgl.DGLGraph(nx_star)
+print('#Nodes:', star.number_of_nodes())
+print('#Edges:', star.number_of_edges())
+###############################################################################
+# Node and edge attributes can be automatically batched when converting from
+# ``networkx`` graph. Since ``networkx`` graph by default does not tell which
+# edge is added the first, we use the ``"id"`` edge attribute as a hint
+# if available.
+for i in range(10):
+    nx_star.nodes[i]['feat'] = th.randn((D,))
+star = dgl.DGLGraph()
+star.from_networkx(nx_star, node_attrs=['feat'])  # auto-batch specified node features
+print(star.get_n_repr()['feat'])
+###############################################################################
+# Multi-edge graph
+# ----------------
+# There are many applications that work on graphs containing multi-edges. To enable
+# this, construct ``DGLGraph`` with ``multigraph=True``.
+g = dgl.DGLGraph(multigraph=True)
+g.add_nodes(5)
+g.add_edge(0, 1)
+g.add_edge(1, 2)
+g.add_edge(0, 1)
+print('#Nodes:', g.number_of_nodes())
+print('#Edges:', g.number_of_edges())
+# init random edge features
+M = g.number_of_edges()
+g.set_e_repr({'he' : th.randn((M, D))})
+###############################################################################
+# Because an edge in multi-graph cannot be uniquely identified using its incident
+# nodes ``u`` and ``v``, you need to use edge id to access edge features. The
+# edge ids can be queried from ``edge_id`` interface.
+eid_01 = g.edge_id(0, 1)
+print(eid_01)
+###############################################################################
+# We can then use the edge id to set/get the features of the corresponding edge.
+g.set_e_repr_by_id({'he' : th.ones(len(eid_01), D)}, eid=eid_01)
+print(g.get_e_repr()['he'])