Fix caching during conditional execution

kpot · kpot · commit 48dbd64fdcdf · 2018-06-25T14:27:30.000+05:00
diff --git a/include/avalanche/ExecutionCache.h b/include/avalanche/ExecutionCache.h
@@ -21,6 +21,7 @@ class ExecutionCache : private CachedItemsMap {
     explicit ExecutionCache(DeviceIndex device_idx);
     explicit ExecutionCache(BufferPoolRef buffer_pool);
     bool get_from_cache_no_counter(NodeId node_id, MultiArrayRef &result) const;
+    bool is_cached(const NodeId node_id) const;
     void zero_reuse_counters();
     void put(const NodeId node_id, const MultiArrayRef &array);
     void set_node_params(NodeId node_id,
diff --git a/src/avalanche/ExecutionCache.cpp b/src/avalanche/ExecutionCache.cpp
@@ -96,5 +96,10 @@ bool ExecutionCache::get_info(NodeId node_id, CachedItem &info) const {
     return false;
 }
 
+bool ExecutionCache::is_cached(const NodeId node_id) const {  // true only if node_id has an entry with data
+    auto cached = find(node_id);  // look the node up among the cached items
+    return cached != this->end() && cached->second.data;  // entry must exist AND its `data` must evaluate to true
+}
+
 
 } // namespace
diff --git a/src/avalanche/conditional_nodes.cpp b/src/avalanche/conditional_nodes.cpp
@@ -45,6 +45,48 @@ Cond::Cond(const NodeRef &condition, const NodeRef &true_node,
     }
 }
 
+/**
+ * Makes sure all inputs of the given node have been evaluated, without
+ * evaluating the node itself, unless it has already been evaluated
+ * and cached previously. This is necessary for the Cond node to work
+ * properly, for two reasons:
+ * 1. To match the behaviour of `cond` from TF, which is this (a quote):
+ *
+ *        Note that the conditional execution applies only to the operations
+ *        defined in true_fn and false_fn. Consider the following simple program:
+ *
+ *        z = tf.multiply(a, b)
+ *        result = tf.cond(x < y, lambda: tf.add(x, z), lambda: tf.square(y))
+ *
+ *        If x < y, the tf.add operation will be executed and tf.square
+ *        operation will not be executed. Since z is needed for at least
+ *        one branch of the cond, the tf.multiply operation is always executed,
+ *        unconditionally. Although this behavior is consistent with
+ *        the dataflow model of TensorFlow, it has occasionally surprised
+ *        some users who expected a lazier semantics.
+ *
+ *        https://www.tensorflow.org/api_docs/python/tf/cond
+ *
+ * 2. Such evaluation helps to make sure we don't have any values stored
+ *    in cache with counters > 0 waiting to be used during the run.
+ *    By evaluating those nodes we imitate usage of them as inputs, thus
+ *    making sure that caching works as expected.
+ */
+
+void evaluate_inputs_of(const NodeRef &node, Context &context,
+                        ExecutionCache &cache) {
+    if (cache.is_cached(node->id)) {
+        // The node is present in the cache, so it (and its inputs) has
+        // already been evaluated. We evaluate it once more (no actual
+        // work will be done) to decrease the cache counter.
+        node->eval(context, cache);
+    } else {
+        for (const auto &inp: node->inputs()) {  // not cached: evaluate only the inputs, never the node itself
+            inp->eval(context, cache);  // return value is ignored; only the evaluation matters here
+        }
+    }
+}
+
 MultiArrayRef Cond::eval(Context &context, ExecutionCache &cache) const {
     MultiArrayRef result;
     if (!cache.get(id, result)) {
@@ -53,8 +95,10 @@ MultiArrayRef Cond::eval(Context &context, ExecutionCache &cache) const {
         cond_value->fetch_data_into(condition);
         if (condition[0]) {
             result = _true_node->eval(context, cache);
+            evaluate_inputs_of(_false_node, context, cache);
         } else {
             result = _false_node->eval(context, cache);
+            evaluate_inputs_of(_true_node, context, cache);
         }
         cache.put(id, result);
     }
diff --git a/test/test_tree_evaluation.cpp b/test/test_tree_evaluation.cpp
@@ -141,17 +141,18 @@ TEST_CASE("Conditional evaluation") {
     auto update1 = F<UpdateAdd>(var1, one);
     auto update2 = F<UpdateAdd>(var2, one);
     auto output = Cond::make(condition, update1, update2);
-    // Only var2 should be incremented, because condition == 0
+    INFO("Check chat only var2 should be incremented, because condition == 0");
     context->init<std::int8_t>(condition, {0});
     evaluate_and_check<float>(output, {1}, Shape(), context);
     evaluate_and_check<float>(var1, {0}, Shape(), context);
     evaluate_and_check<float>(var2, {1}, Shape(), context);
-    // Now only var1 should be incremented, because condition == 1
+    INFO("Now only var1 should be incremented, because condition == 1");
     context->init<std::int8_t>(condition, {1});
     evaluate_and_check<float>(output, {1}, Shape(), context);
     evaluate_and_check<float>(var1, {1}, Shape(), context);
     evaluate_and_check<float>(var2, {1}, Shape(), context);
-    // Again only var1 should be incremented, because condition is still == 1
+    INFO("Again only var1 should be incremented, "
+         "because condition is still == 1");
     evaluate_and_check<float>(output, {2}, Shape(), context);
     evaluate_and_check<float>(var1, {2}, Shape(), context);
     evaluate_and_check<float>(var2, {1}, Shape(), context);

Original file line number	Diff line number	Diff line change
`@@ -96,5 +96,10 @@ bool ExecutionCache::get_info(NodeId node_id, CachedItem &info) const {`
`96`	`96`	`return false;`
`97`	`97`	`}`
`98`	`98`
	`99`	`+bool ExecutionCache::is_cached(const NodeId node_id) const {`
	`100`	`+ auto cached = find(node_id);`
	`101`	`+ return cached != this->end() && cached->second.data;`
	`102`	`+}`
	`103`	`+`
`99`	`104`
`100`	`105`	`} // namespace`