arangodb
diff --git a/‎site/content/3.10/data-science/adapters/arangodb-cugraph-adapter.md‎
Lines changed: 90 additions & 34 deletions b/‎site/content/3.10/data-science/adapters/arangodb-cugraph-adapter.md‎
Lines changed: 90 additions & 34 deletions
diff --git a/‎site/content/3.10/data-science/adapters/arangodb-dgl-adapter.md‎
Lines changed: 199 additions & 22 deletions b/‎site/content/3.10/data-science/adapters/arangodb-dgl-adapter.md‎
Lines changed: 199 additions & 22 deletions
@@ -24,7 +24,8 @@ To install the latest release of the ArangoDB-cuGraph Adapter,
 run the following command:
 
 ```bash
-conda install -c arangodb adbcug-adapter
+pip install --extra-index-url=https://pypi.nvidia.com cudf-cu11 cugraph-cu11
+pip install adbcug-adapter
 ```
 
 ## Quickstart
@@ -36,53 +37,108 @@ Check also the
 ```py
 import cudf
 import cugraph
-from arango import ArangoClient # Python-Arango driver
 
-from adbcug_adapter import ADBCUG_Adapter
+from arango import ArangoClient
+from adbcug_adapter import ADBCUG_Adapter, ADBCUG_Controller
 
-# Let's assume that the ArangoDB "fraud detection" dataset is imported to this endpoint
-db = ArangoClient(hosts="http://localhost:8529").db("_system", username="root", password="")
+# Connect to ArangoDB
+db = ArangoClient().db()
 
+# Instantiate the adapter
 adbcug_adapter = ADBCUG_Adapter(db)
+```
+
+### ArangoDB to cuGraph
+```py
+#######################
+# 1.1: via Graph name #
+#######################
 
-# Use Case 1.1: ArangoDB to cuGraph via Graph name
-cug_fraud_graph = adbcug_adapter.arangodb_graph_to_cugraph("fraud-detection")
+cug_g = adbcug_adapter.arangodb_graph_to_cugraph("fraud-detection")
 
-# Use Case 1.2: ArangoDB to cuGraph via Collection names
-cug_fraud_graph_2 = adbcug_adapter.arangodb_collections_to_cugraph(
+#############################
+# 1.2: via Collection names #
+#############################
+
+cug_g = adbcug_adapter.arangodb_collections_to_cugraph(
     "fraud-detection",
     {"account", "bank", "branch", "Class", "customer"},  #  Vertex collections
     {"accountHolder", "Relationship", "transaction"},  # Edge collections
 )
+```
 
-# Use Case 2: cuGraph to ArangoDB:
-## 1) Create a sample cuGraph
-cug_divisibility_graph = cugraph.MultiGraph(directed=True)
-cug_divisibility_graph.from_cudf_edgelist(
-    cudf.DataFrame(
-        [
-            (f"numbers/{j}", f"numbers/{i}", j / i)
-            for i in range(1, 101)
-            for j in range(1, 101)
-            if j % i == 0
-        ],
-        columns=["src", "dst", "weight"],
-    ),
-    source="src",
-    destination="dst",
-    edge_attr="weight",
-    renumber=False,
-)
+### cuGraph to ArangoDB
+```py
+#################################
+# 2.1: with a Homogeneous Graph #
+#################################
+
+edges = [("Person/A", "Person/B", 1), ("Person/B", "Person/C", -1)]
+cug_g = cugraph.MultiGraph(directed=True)
+cug_g.from_cudf_edgelist(cudf.DataFrame(edges, columns=["src", "dst", "weight"]), source="src", destination="dst", edge_attr="weight")
 
-## 2) Create ArangoDB Edge Definitions
 edge_definitions = [
     {
-        "edge_collection": "is_divisible_by",
-        "from_vertex_collections": ["numbers"],
-        "to_vertex_collections": ["numbers"],
+        "edge_collection": "knows",
+        "from_vertex_collections": ["Person"],
+        "to_vertex_collections": ["Person"],
     }
 ]
 
-## 3) Convert cuGraph to ArangoDB
-adb_graph = adbcug_adapter.cugraph_to_arangodb("DivisibilityGraph", cug_graph, edge_definitions)
-```
+adb_g = adbcug_adapter.cugraph_to_arangodb("Knows", cug_g, edge_definitions, edge_attr="weight")
+
+##############################################################
+# 2.2: with a Homogeneous Graph & a custom ADBCUG Controller #
+##############################################################
+
+class Custom_ADBCUG_Controller(ADBCUG_Controller):
+    """ArangoDB-cuGraph controller.
+
+    Responsible for controlling how nodes & edges are handled when
+    transitioning from ArangoDB to cuGraph & vice-versa.
+    """
+
+    def _prepare_cugraph_node(self, cug_node: dict, col: str) -> None:
+        """Prepare a cuGraph node before it gets inserted into the ArangoDB
+        collection **col**.
+
+        :param cug_node: The cuGraph node object to (optionally) modify.
+        :param col: The ArangoDB collection the node belongs to.
+        """
+        cug_node["foo"] = "bar"
+
+    def _prepare_cugraph_edge(self, cug_edge: dict, col: str) -> None:
+        """Prepare a cuGraph edge before it gets inserted into the ArangoDB
+        collection **col**.
+
+        :param cug_edge: The cuGraph edge object to (optionally) modify.
+        :param col: The ArangoDB collection the edge belongs to.
+        """
+        cug_edge["bar"] = "foo"
+
+adb_g = ADBCUG_Adapter(db, Custom_ADBCUG_Controller()).cugraph_to_arangodb("Knows", cug_g, edge_definitions)
+
+###################################
+# 2.3: with a Heterogeneous Graph #
+###################################
+
+edges = [
+   ('student:101', 'lecture:101'), 
+   ('student:102', 'lecture:102'), 
+   ('student:103', 'lecture:103'), 
+   ('student:103', 'student:101'), 
+   ('student:103', 'student:102'),
+   ('teacher:101', 'lecture:101'),
+   ('teacher:102', 'lecture:102'),
+   ('teacher:103', 'lecture:103'),
+   ('teacher:101', 'teacher:102'),
+   ('teacher:102', 'teacher:103')
+]
+cug_g = cugraph.MultiGraph(directed=True)
+cug_g.from_cudf_edgelist(cudf.DataFrame(edges, columns=["src", "dst"]), source='src', destination='dst')
+
+# ...
+
+# Learn how this example is handled in Colab:
+# https://colab.research.google.com/github/arangoml/cugraph-adapter/blob/master/examples/ArangoDB_cuGraph_Adapter.ipynb#scrollTo=nuVoCZQv6oyi
+```
@@ -38,38 +38,215 @@ Check also the
 [interactive tutorial](https://colab.research.google.com/github/arangoml/dgl-adapter/blob/master/examples/ArangoDB_DGL_Adapter.ipynb).
 
 ```py
-from arango import ArangoClient  # Python-Arango driver
-from dgl.data import KarateClubDataset # Sample graph from DGL
+import dgl
+import torch
+import pandas
 
-# Let's assume that the ArangoDB "fraud detection" dataset is imported to this endpoint
-db = ArangoClient(hosts="http://localhost:8529").db("_system", username="root", password="")
+from arango import ArangoClient
+from adbdgl_adapter import ADBDGL_Adapter, ADBDGL_Controller
+from adbdgl_adapter.encoders import IdentityEncoder, CategoricalEncoder
 
+# Connect to ArangoDB
+db = ArangoClient().db()
+
+# Instantiate the adapter
 adbdgl_adapter = ADBDGL_Adapter(db)
 
-# Use Case 1.1: ArangoDB to DGL via Graph name
-dgl_fraud_graph = adbdgl_adapter.arangodb_graph_to_dgl("fraud-detection")
+# Create a DGL Heterogeneous Graph
+fake_hetero = dgl.heterograph({
+    ("user", "follows", "user"): (torch.tensor([0, 1]), torch.tensor([1, 2])),
+    ("user", "follows", "topic"): (torch.tensor([1, 1]), torch.tensor([1, 2])),
+    ("user", "plays", "game"): (torch.tensor([0, 3]), torch.tensor([3, 4])),
+})
+fake_hetero.nodes["user"].data["features"] = torch.tensor([21, 44, 16, 25])
+fake_hetero.nodes["user"].data["label"] = torch.tensor([1, 2, 0, 1])
+fake_hetero.nodes["game"].data["features"] = torch.tensor([[0, 0], [0, 1], [1, 0], [1, 1], [1, 1]])
+fake_hetero.edges[("user", "plays", "game")].data["features"] = torch.tensor([[6, 1], [1000, 0]])
+```
+
+### DGL to ArangoDB
+```py
+############################
+# 1.1: without a Metagraph #
+############################
 
-# Use Case 1.2: ArangoDB to DGL via Collection names
-dgl_fraud_graph_2 = adbdgl_adapter.arangodb_collections_to_dgl(
-    "fraud-detection",
-    {"account", "Class", "customer"},  # Vertex collections
-    {"accountHolder", "Relationship", "transaction"},  # Edge collections
-)
+adb_g = adbdgl_adapter.dgl_to_arangodb("FakeHetero", fake_hetero)
 
-# Use Case 1.3: ArangoDB to DGL via Metagraph
+#########################
+# 1.2: with a Metagraph #
+#########################
+
+# Specifying a Metagraph provides customized adapter behaviour
 metagraph = {
+    "nodeTypes": {
+        "user": {
+            "features": "user_age",  # 1) you can specify a string value for attribute renaming
+            "label": label_tensor_to_2_column_dataframe,  # 2) you can specify a function for user-defined handling, as long as the function returns a Pandas DataFrame
+        },
+        # 3) You can specify a set of strings if you want to preserve the same DGL attribute names for the node/edge type
+        "game": {"features"} # this is equivalent to {"features": "features"}
+    },
+    "edgeTypes": {
+        ("user", "plays", "game"): {
+            # 4) you can specify a list of strings for tensor disassembly (if you know the number of node/edge features in advance)
+            "features": ["hours_played", "is_satisfied_with_game"]
+        },
+    },
+}
+
+def label_tensor_to_2_column_dataframe(dgl_tensor: torch.Tensor, adb_df: pandas.DataFrame) -> pandas.DataFrame:
+    """A user-defined function to create two
+    ArangoDB attributes out of the 'user' label tensor
+
+    :param dgl_tensor: The DGL Tensor containing the data
+    :type dgl_tensor: torch.Tensor
+    :param adb_df: The ArangoDB DataFrame to populate, whose
+        size is preset to the length of **dgl_tensor**.
+    :type adb_df: pandas.DataFrame
+    :return: The populated ArangoDB DataFrame
+    :rtype: pandas.DataFrame
+    """
+    label_map = {0: "Class A", 1: "Class B", 2: "Class C"}
+
+    adb_df["label_num"] = dgl_tensor.tolist()
+    adb_df["label_str"] = adb_df["label_num"].map(label_map)
+
+    return adb_df
+
+
+adb_g = adbdgl_adapter.dgl_to_arangodb("FakeHetero", fake_hetero, metagraph, explicit_metagraph=False)
+
+#######################################################
+# 1.3: with a Metagraph and `explicit_metagraph=True` #
+#######################################################
+
+# With `explicit_metagraph=True`, the node & edge types omitted from the metagraph will NOT be converted to ArangoDB.
+adb_g = adbdgl_adapter.dgl_to_arangodb("FakeHetero", fake_hetero, metagraph, explicit_metagraph=True)
+
+########################################
+# 1.4: with a custom ADBDGL Controller #
+########################################
+
+class Custom_ADBDGL_Controller(ADBDGL_Controller):
+    def _prepare_dgl_node(self, dgl_node: dict, node_type: str) -> dict:
+        """Optionally modify a DGL node object before it gets inserted into its designated ArangoDB collection.
+
+        :param dgl_node: The DGL node object to (optionally) modify.
+        :param node_type: The DGL Node Type of the node.
+        :return: The DGL Node object
+        """
+        dgl_node["foo"] = "bar"
+        return dgl_node
+
+    def _prepare_dgl_edge(self, dgl_edge: dict, edge_type: tuple) -> dict:
+        """Optionally modify a DGL edge object before it gets inserted into its designated ArangoDB collection.
+
+        :param dgl_edge: The DGL edge object to (optionally) modify.
+        :param edge_type: The Edge Type of the DGL edge. Formatted
+            as (from_collection, edge_collection, to_collection)
+        :return: The DGL Edge object
+        """
+        dgl_edge["bar"] = "foo"
+        return dgl_edge
+
+
+adb_g = ADBDGL_Adapter(db, Custom_ADBDGL_Controller()).dgl_to_arangodb("FakeHetero", fake_hetero)
+```
+
+### ArangoDB to DGL
+```py
+# Start from scratch!
+db.delete_graph("FakeHetero", drop_collections=True, ignore_missing=True)
+adbdgl_adapter.dgl_to_arangodb("FakeHetero", fake_hetero)
+
+#######################
+# 2.1: via Graph name #
+#######################
+
+# Due to the risk of ambiguity, this method does not transfer attributes
+dgl_g = adbdgl_adapter.arangodb_graph_to_dgl("FakeHetero")
+
+#############################
+# 2.2: via Collection names #
+#############################
+
+# Due to the risk of ambiguity, this method does not transfer attributes
+dgl_g = adbdgl_adapter.arangodb_collections_to_dgl("FakeHetero", v_cols={"user", "game"}, e_cols={"plays"})
+
+######################
+# 2.3: via Metagraph #
+######################
+
+# Transfers attributes "as is", which assumes they are already formatted to DGL data standards.
+# Learn more about the DGL Data Standards here: https://docs.dgl.ai/guide/graph.html#guide-graph
+metagraph_v1 = {
     "vertexCollections": {
-        "account": {"Balance", "account_type", "customer_id", "rank"},
-        "customer": {"Name", "rank"},
+        # Move the "features" & "label" ArangoDB attributes to DGL as "features" & "label" Tensors
+        "user": {"features", "label"}, # equivalent to {"features": "features", "label": "label"}
+        "game": {"dgl_game_features": "features"},
+        "topic": {},
     },
     "edgeCollections": {
-        "transaction": {"transaction_amt", "sender_bank_id", "receiver_bank_id"},
-        "accountHolder": {},
+        "plays": {"dgl_plays_features": "features"}, 
+        "follows": {}
     },
 }
-dgl_fraud_graph_3 = adbdgl_adapter.arangodb_to_dgl("fraud-detection", metagraph)
 
-# Use Case 2: DGL to ArangoDB
-dgl_karate_graph = KarateClubDataset()[0]
-adb_karate_graph = adbdgl_adapter.dgl_to_arangodb("Karate", dgl_karate_graph)
-```
+dgl_g = adbdgl_adapter.arangodb_to_dgl("FakeHetero", metagraph_v1)
+
+#################################################
+# 2.4: via Metagraph with user-defined encoders #
+#################################################
+
+# Transforms attributes via user-defined encoders
+metagraph_v2 = {
+    "vertexCollections": {
+        "Movies": {
+            "features": {  # Build a feature matrix from the "Action" & "Drama" document attributes
+                "Action": IdentityEncoder(dtype=torch.long),
+                "Drama": IdentityEncoder(dtype=torch.long),
+            },
+            "label": "Comedy",
+        },
+        "Users": {
+            "features": {
+                "Gender": CategoricalEncoder(), # CategoricalEncoder(mapping={"M": 0, "F": 1}),
+                "Age": IdentityEncoder(dtype=torch.long),
+            }
+        },
+    },
+    "edgeCollections": {"Ratings": {"weight": "Rating"}},
+}
+
+dgl_g = adbdgl_adapter.arangodb_to_dgl("imdb", metagraph_v2)
+
+##################################################
+# 2.5: via Metagraph with user-defined functions #
+##################################################
+
+# Transforms attributes via user-defined functions
+metagraph_v3 = {
+    "vertexCollections": {
+        "user": {
+            "features": udf_user_features,  # supports named functions
+            "label": lambda df: torch.tensor(df["label"].to_list()),  # also supports lambda functions
+        },
+        "game": {"features": udf_game_features},
+    },
+    "edgeCollections": {
+        "plays": {"features": (lambda df: torch.tensor(df["features"].to_list()))},
+    },
+}
+
+def udf_user_features(user_df: pandas.DataFrame) -> torch.Tensor:
+    # user_df["features"] = ...
+    return torch.tensor(user_df["features"].to_list())
+
+
+def udf_game_features(game_df: pandas.DataFrame) -> torch.Tensor:
+    # game_df["features"] = ...
+    return torch.tensor(game_df["features"].to_list())
+
+
+dgl_g = adbdgl_adapter.arangodb_to_dgl("FakeHetero", metagraph_v3)
+```