feat(torque): add 6 new query methods for graph traversal (#57)

arun1729 · web-flow · commit d1da062375e7 · 2025-12-23T15:27:28.000-05:00
* feat(torque): add 6 new query methods for graph traversal

New methods:
- both(predicates): traverse edges in both directions
- is_(*nodes): filter to specific nodes
- unique(): remove duplicate vertices from results
- limit(n): limit results to first N vertices
- skip(n): skip first N vertices in results
- back(tag): return to previously tagged position

Includes 18 new tests and README documentation

* adding discord link

* chore: bump version to 3.2.0
diff --git a/README.md b/README.md
@@ -1,17 +1,14 @@
 ![](https://static.pepy.tech/badge/cogdb) [![PyPI version](https://badge.fury.io/py/cogdb.svg)](https://badge.fury.io/py/cogdb) ![Python 3.8](https://img.shields.io/badge/python-3.8+-blue.svg)
- [![Build Status](https://travis-ci.org/arun1729/cog.svg?branch=master)](https://travis-ci.org/arun1729/cog) [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT) [![codecov](https://codecov.io/gh/arun1729/cog/branch/master/graph/badge.svg)](https://codecov.io/gh/arun1729/cog)
+ [![Build Status](https://travis-ci.org/arun1729/cog.svg?branch=master)](https://travis-ci.org/arun1729/cog) [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT) [![codecov](https://codecov.io/gh/arun1729/cog/branch/master/graph/badge.svg)](https://codecov.io/gh/arun1729/cog) [![Discord](https://img.shields.io/badge/Discord-Join%20Server-7289da?logo=discord&logoColor=white)](https://discord.gg/nqNpNGfjts)
 
 # ![logo](cog-logo.png)
 # CogDB - Micro Graph Database for Python Applications
 > Documents and examples at [cogdb.io](https://cogdb.io)
 
-> New release: 3.1.0
-> - **Batch insert mode** for significantly faster bulk graph loading
-> - New `put_batch()` method for efficient triple insertion
-> - Performance improvements: up to 1.6x faster inserts at scale
-> - New word embeddings API
-> - Similarity filtering using word embeddings
-> - Filter step
+> New release: 3.2.0
+> - New Torque query methods: `both()`, `is_()`, `unique()`, `limit()`, `skip()`, `back()`
+> - Bidirectional traversal and pagination support
+> - Navigate back to tagged vertices
 
 ![ScreenShot](notes/ex2.png)
 
@@ -182,6 +179,52 @@ g.v("emily").out("follows").filter(func=lambda x: x.startswith("f")).all()
 ```
 > {'result': [{'id': 'fred'}]}
 
+#### Bidirectional Traversal
+
+Follow edges in both directions (outgoing and incoming):
+```python
+g.v("bob").both("follows").all()
+```
+> {'result': [{'id': 'fred'}, {'id': 'alice'}, {'id': 'charlie'}, {'id': 'dani'}]}
+
+#### Filter to Specific Nodes
+
+Filter results to only include specific vertices:
+```python
+g.v("alice").out("follows").is_("bob", "dani").all()
+```
+> {'result': [{'id': 'bob'}, {'id': 'dani'}]}
+
+#### Remove Duplicates
+
+Remove duplicate vertices from results:
+```python
+g.v().out("follows").unique().all()
+```
+> {'result': [{'id': 'bob'}, {'id': 'fred'}, {'id': 'greg'}, {'id': 'dani'}]}
+
+#### Pagination with Limit and Skip
+
+Limit results to the first N vertices:
+```python
+g.v().limit(3).all()
+```
+> {'result': [{'id': 'alice'}, {'id': 'bob'}, {'id': 'charlie'}]}
+
+Skip the first N vertices (chain `limit()` after `skip()` to page through results):
+```python
+g.v().skip(2).limit(2).all()
+```
+> {'result': [{'id': 'charlie'}, {'id': 'dani'}]}
+
+#### Navigate Back to Tagged Vertex
+
+Return to a previously tagged position while preserving the traversal path:
+```python
+g.v("alice").tag("start").out("follows").out("follows").back("start").all()
+```
+> {'result': [{'start': 'alice', 'id': 'alice'}]}
+
 
 #### json example
 
diff --git a/cog/torque.py b/cog/torque.py
@@ -450,6 +450,114 @@ def filter(self, func):
         self.last_visited_vertices = [v for v in self.last_visited_vertices if func(v.id)]
         return self
 
+    def both(self, predicates=None):
+        '''
+        Traverse edges in both directions (out + in).
+        :param predicates: A string or list of predicate strings to follow.
+        :return: self for method chaining.
+        '''
+        if predicates is not None:
+            if not isinstance(predicates, list):
+                predicates = [predicates]
+            predicates = list(map(hash_predicate, predicates))
+        else:
+            predicates = self.all_predicates
+
+        self.cog.use_namespace(self.graph_name)
+        traverse_vertex = []
+
+        for predicate in predicates:
+            for v in self.last_visited_vertices:
+                # Outgoing edges
+                out_record = self.cog.use_table(predicate).get(out_nodes(v.id))
+                if out_record is not None:
+                    if out_record.value_type == "s":
+                        v_adj = Vertex(str(out_record.value)).set_edge(predicate)
+                        v_adj.tags.update(v.tags)
+                        traverse_vertex.append(v_adj)
+                    elif out_record.value_type == "l":
+                        for v_adjacent in out_record.value:
+                            v_adj = Vertex(v_adjacent).set_edge(predicate)
+                            v_adj.tags.update(v.tags)
+                            traverse_vertex.append(v_adj)
+
+                # Incoming edges
+                in_record = self.cog.use_table(predicate).get(in_nodes(v.id))
+                if in_record is not None:
+                    if in_record.value_type == "s":
+                        v_adj = Vertex(str(in_record.value)).set_edge(predicate)
+                        v_adj.tags.update(v.tags)
+                        traverse_vertex.append(v_adj)
+                    elif in_record.value_type == "l":
+                        for v_adjacent in in_record.value:
+                            v_adj = Vertex(v_adjacent).set_edge(predicate)
+                            v_adj.tags.update(v.tags)
+                            traverse_vertex.append(v_adj)
+
+        self.last_visited_vertices = traverse_vertex
+        return self
+
+    def is_(self, *nodes):
+        '''
+        Filter paths to only those currently at the specified node(s).
+        :param nodes: One or more node IDs to filter to.
+        :return: self for method chaining.
+        '''
+        if len(nodes) == 1 and isinstance(nodes[0], list):
+            node_set = set(nodes[0])
+        else:
+            node_set = set(nodes)
+        self.last_visited_vertices = [v for v in self.last_visited_vertices if v.id in node_set]
+        return self
+
+    def unique(self):
+        '''
+        Remove duplicate vertices from the result set.
+        :return: self for method chaining.
+        '''
+        seen = set()
+        unique_vertices = []
+        for v in self.last_visited_vertices:
+            if v.id not in seen:
+                seen.add(v.id)
+                unique_vertices.append(v)
+        self.last_visited_vertices = unique_vertices
+        return self
+
+    def limit(self, n):
+        '''
+        Limit results to the first N vertices.
+        :param n: Maximum number of vertices to return.
+        :return: self for method chaining.
+        '''
+        self.last_visited_vertices = self.last_visited_vertices[:n]
+        return self
+
+    def skip(self, n):
+        '''
+        Skip the first N vertices in the result set.
+        :param n: Number of vertices to skip.
+        :return: self for method chaining.
+        '''
+        self.last_visited_vertices = self.last_visited_vertices[n:]
+        return self
+
+    def back(self, tag):
+        '''
+        Return to vertices saved at the given tag, preserving all constraints.
+        :param tag: A previous tag in the query to jump back to.
+        :return: self for method chaining.
+        '''
+        vertices = []
+        for v in self.last_visited_vertices:
+            if tag in v.tags:
+                tagged_vertex = Vertex(v.tags[tag])
+                tagged_vertex.tags = v.tags.copy()
+                tagged_vertex.edges = v.edges.copy()
+                vertices.append(tagged_vertex)
+        self.last_visited_vertices = vertices
+        return self
+
     def sim(self, word, operator, threshold, strict=False):
         """
             Applies cosine similarity filter to the vertices and removes any vertices that do not pass the filter.
diff --git a/setup.py b/setup.py
@@ -2,7 +2,7 @@
 
 
 setup(name='cogdb',
-      version='3.1.0',
+      version='3.2.0',
       description='Persistent Embedded Graph Database',
       url='http://github.com/arun1729/cog',
       author='Arun Mahendra',
diff --git a/test/test_torque_extensions.py b/test/test_torque_extensions.py
@@ -0,0 +1,193 @@
+from cog.torque import Graph
+import unittest
+import os
+import shutil
+
+# Directory name for this suite's graph data: passed to Graph as cog_home, and
+# created/removed as "/tmp/" + DIR_NAME by setUpClass/tearDownClass.
+DIR_NAME = "TorqueExtensionsTest"
+
+
+def ordered(obj):
+    if isinstance(obj, dict):
+        return sorted((k, ordered(v)) for k, v in list(obj.items()))
+    if isinstance(obj, list):
+        return sorted(ordered(x) for x in obj)
+    else:
+        return obj
+
+
+class TorqueExtensionsTest(unittest.TestCase):
+    """
+    Tests for new Torque traversal methods:
+    - both(): bidirectional traversal
+    - is_(): filter to specific nodes
+    - unique(): remove duplicates
+    - limit(): limit results
+    - skip(): skip results
+    - back(): return to tagged position
+    """
+    maxDiff = None
+
+    @classmethod
+    def setUpClass(cls):
+        if os.path.exists("/tmp/" + DIR_NAME):
+            shutil.rmtree("/tmp/" + DIR_NAME)
+        os.mkdir("/tmp/" + DIR_NAME)
+
+        cls.g = Graph(graph_name="test_graph", cog_home=DIR_NAME)
+        # Create a simple test graph:
+        # alice -> bob -> charlie -> alice (cycle)
+        # alice -> dani
+        # bob has status "cool"
+        cls.g.put("alice", "follows", "bob")
+        cls.g.put("bob", "follows", "charlie")
+        cls.g.put("charlie", "follows", "alice")
+        cls.g.put("alice", "follows", "dani")
+        cls.g.put("bob", "status", "cool")
+        cls.g.put("dani", "status", "cool")
+        print(">>> TorqueExtensionsTest setup complete.\n")
+
+    # =========== both() tests ===========
+
+    def test_both_follows_from_bob(self):
+        """both() should return vertices connected by edges in either direction."""
+        result = self.g.v("bob").both("follows").all()
+        ids = {r['id'] for r in result['result']}
+        # bob follows charlie, alice follows bob
+        self.assertIn("charlie", ids)
+        self.assertIn("alice", ids)
+
+    def test_both_no_predicate(self):
+        """both() with no predicate should follow all edge types."""
+        result = self.g.v("bob").both().all()
+        ids = {r['id'] for r in result['result']}
+        # bob -> charlie (follows), alice -> bob (follows), bob -> cool (status)
+        self.assertIn("charlie", ids)
+        self.assertIn("alice", ids)
+        self.assertIn("cool", ids)
+
+    # =========== is_() tests ===========
+
+    def test_is_single_node(self):
+        """is_() should filter to only the specified node."""
+        result = self.g.v("alice").out("follows").is_("bob").all()
+        self.assertEqual(len(result['result']), 1)
+        self.assertEqual(result['result'][0]['id'], "bob")
+
+    def test_is_multiple_nodes(self):
+        """is_() should accept multiple nodes."""
+        result = self.g.v("alice").out("follows").is_("bob", "dani").all()
+        ids = {r['id'] for r in result['result']}
+        self.assertEqual(ids, {"bob", "dani"})
+
+    def test_is_no_match(self):
+        """is_() should return empty if no nodes match."""
+        result = self.g.v("alice").out("follows").is_("nonexistent").all()
+        self.assertEqual(result['result'], [])
+
+    def test_is_with_list(self):
+        """is_() should accept a list of nodes."""
+        result = self.g.v("alice").out("follows").is_(["bob", "dani"]).all()
+        ids = {r['id'] for r in result['result']}
+        self.assertEqual(ids, {"bob", "dani"})
+
+    # =========== unique() tests ===========
+
+    def test_unique_removes_duplicates(self):
+        """unique() should remove duplicate vertices."""
+        # Get all followers' statuses - "cool" appears twice (bob and dani)
+        result_without_unique = self.g.v("alice").out("follows").out("status").all()
+        result_with_unique = self.g.v("alice").out("follows").out("status").unique().all()
+
+        # Without unique, we should have duplicates
+        ids_without = [r['id'] for r in result_without_unique['result']]
+        self.assertEqual(ids_without.count("cool"), 2)
+
+        # With unique, no duplicates
+        ids_with = [r['id'] for r in result_with_unique['result']]
+        self.assertEqual(ids_with.count("cool"), 1)
+
+    def test_unique_preserves_order(self):
+        """unique() should preserve the order of first occurrence."""
+        result = self.g.v().unique().all()
+        # Should have vertices in order of first appearance
+        self.assertTrue(len(result['result']) > 0)
+
+    # =========== limit() tests ===========
+
+    def test_limit_returns_n_results(self):
+        """limit() should return at most N vertices."""
+        result = self.g.v().limit(2).all()
+        self.assertEqual(len(result['result']), 2)
+
+    def test_limit_more_than_available(self):
+        """limit() with N larger than result set should return all."""
+        all_result = self.g.v().all()
+        limited_result = self.g.v().limit(1000).all()
+        self.assertEqual(len(all_result['result']), len(limited_result['result']))
+
+    def test_limit_zero(self):
+        """limit(0) should return empty."""
+        result = self.g.v().limit(0).all()
+        self.assertEqual(result['result'], [])
+
+    # =========== skip() tests ===========
+
+    def test_skip_skips_n_results(self):
+        """skip() should skip the first N vertices."""
+        all_result = self.g.v().all()
+        skipped_result = self.g.v().skip(2).all()
+        self.assertEqual(len(skipped_result['result']), len(all_result['result']) - 2)
+
+    def test_skip_more_than_available(self):
+        """skip() with N larger than result set should return empty."""
+        result = self.g.v().skip(1000).all()
+        self.assertEqual(result['result'], [])
+
+    def test_limit_and_skip_pagination(self):
+        """limit() and skip() together enable pagination."""
+        all_result = self.g.v().all()
+        page1 = self.g.v().limit(2).all()
+        page2 = self.g.v().skip(2).limit(2).all()
+
+        # Pages should not overlap
+        page1_ids = {r['id'] for r in page1['result']}
+        page2_ids = {r['id'] for r in page2['result']}
+        self.assertEqual(len(page1_ids & page2_ids), 0)
+
+    # =========== back() tests ===========
+
+    def test_back_returns_to_tagged_vertex(self):
+        """back() should return to the previously tagged vertex."""
+        result = self.g.v("alice").tag("start").out("follows").back("start").all()
+        # Should return to alice
+        ids = {r['id'] for r in result['result']}
+        self.assertEqual(ids, {"alice"})
+
+    def test_back_preserves_tags(self):
+        """back() should preserve existing tags."""
+        result = self.g.v("alice").tag("origin").out("follows").tag("middle").back("origin").all()
+        for r in result['result']:
+            self.assertIn("origin", r)
+            self.assertIn("middle", r)
+
+    def test_back_with_invalid_tag(self):
+        """back() with non-existent tag should return empty."""
+        result = self.g.v("alice").out("follows").back("nonexistent").all()
+        self.assertEqual(result['result'], [])
+
+    def test_back_after_filter(self):
+        """back() should work with filtered results."""
+        result = self.g.v("alice").tag("start").out("follows").has("status", "cool").back("start").all()
+        # Only bob has status cool, so we should get back to alice (who follows bob)
+        ids = {r['id'] for r in result['result']}
+        self.assertEqual(ids, {"alice"})
+
+    @classmethod
+    def tearDownClass(cls):
+        cls.g.close()
+        shutil.rmtree("/tmp/" + DIR_NAME)
+        print("*** TorqueExtensionsTest cleanup complete.")
+
+
+# Run this module's tests when the file is executed directly as a script.
+if __name__ == '__main__':
+    unittest.main()