CogComp · bhargav · Apr 9, 2017 · Apr 9, 2017 · kordjamshidi · Jul 18, 2017
diff --git a/saul-core/doc/CONCEPTUALSTRUCTURE.md b/saul-core/doc/CONCEPTUALSTRUCTURE.md
@@ -37,19 +37,28 @@ In this definition `pos` is defined to be a property of nodes of type token. The
 inside `{ .... }` is  the definition of a sensor which given an object of type `ConllRawToken` i.e. the tye of node and
 generates an output property value (in this case, using the POS tag of an object of type `ConllRawToken`).
 
-If the content of a property is computationally intensive to compute, you can cache its value, by setting `cache` to be
+If the content of a property is computationally intensive to compute, you can cache its Feature Vector, by setting `cacheFeatureVector` to be
 `true`: 
 ```scala
-val pos = property(token, cache = true) {
+val pos = property(token, cacheFeatureVector = true) {
    (t: ConllRawToken) => t.POS
 }
 ```
 
-The first time that a property is called with a specific value, it would you remember the corresponding output, 
-so next time it just looks up the value from the cache. 
+During the first training iteration, the feature vector is computed and cached during further iterations of training/testing. This value is cached in-memory for the lifetime of the app. Using this feature judiciously and make sure you have enough free memory (RAM) available.
 
-Note that when training, the property cache is remove between two training interation in order not to interrupt 
-the trainng procedure. 
+If you want to cache the value of a feature during a single iteration, use the `cache` parameter.
+
+The `cache` parameter allows the value to be cached within a training/testing iteration. This is useful if you one of your features depends on evaluation of a Classifier on other instances as well. This recursive evaluation of the Classifier might be expensive and caching would speed-up performance. Look at a sample usage of this parameter in the [POSTagging Example](../../saul-examples/src/main/scala/edu/illinois/cs/cogcomp/saulexamples/nlp/POSTagger/POSDataModel.scala#L66).
+
+ Usage:
+ ```scala
+ val posWindow = property(token, cache = true) {
+    (t: ConllRawToken) => t.getNeighbors.map(n => posWindow(n))
+ }
+ ```
+
+ The value of these properties are cleared at the end of each training iteration.
 
 #### Parameterized properties 
 Suppose you want to define properties which get some parameters; this can be important when we want to programmatically 

diff --git a/saul-core/src/main/scala/edu/illinois/cs/cogcomp/saul/classifier/Learnable.scala b/saul-core/src/main/scala/edu/illinois/cs/cogcomp/saul/classifier/Learnable.scala
@@ -18,7 +18,7 @@ import edu.illinois.cs.cogcomp.lbjava.parse.FoldParser.SplitPolicy
 import edu.illinois.cs.cogcomp.lbjava.parse.{ FoldParser, Parser }
 import edu.illinois.cs.cogcomp.saul.datamodel.DataModel
 import edu.illinois.cs.cogcomp.saul.datamodel.edge.Link
-import edu.illinois.cs.cogcomp.saul.datamodel.node.Node
+import edu.illinois.cs.cogcomp.saul.datamodel.node.{ Node, NodeProperty }
 import edu.illinois.cs.cogcomp.saul.datamodel.property.{ CombinedDiscreteProperty, Property, PropertyWithWindow }
 import edu.illinois.cs.cogcomp.saul.lbjrelated.LBJLearnerEquivalent
 import edu.illinois.cs.cogcomp.saul.parser.{ IterableToLBJavaParser, LBJavaParserToIterable }
@@ -51,8 +51,12 @@ abstract class Learnable[T <: AnyRef](val node: Node[T], val parameters: Paramet
   def feature: List[Property[T]] = node.properties.toList
 
   /** filter out the label from the features */
-  def combinedProperties = if (label != null) new CombinedDiscreteProperty[T](this.feature.filterNot(_.name == label.name))
-  else new CombinedDiscreteProperty[T](this.feature)
+  def combinedProperties = {
+    val features = if (label != null) this.feature.filterNot(_.name == label.name) else this.feature
+
+    // Support Feature Vector Caching during training.
+    new CombinedDiscreteProperty[T](features, supportsFeatureVectorCaching = true)
+  }
 
   def lbpFeatures = Property.convertToClassifier(combinedProperties)
 

diff --git a/saul-core/src/main/scala/edu/illinois/cs/cogcomp/saul/datamodel/DataModel.scala b/saul-core/src/main/scala/edu/illinois/cs/cogcomp/saul/datamodel/DataModel.scala
@@ -160,7 +160,34 @@ trait DataModel extends Logging {
     e
   }
 
-  class PropertyApply[T <: AnyRef] private[DataModel] (val node: Node[T], name: String, cache: Boolean, ordered: Boolean) {
+  /** Helper class to facilitate creating new [[Property]] instances.
+    *
+    * Note:
+    * - The `cache` parameter is used to cache a property sensor's value within a single training iteration. This is
+    *   useful if properties are defined recursively.
+    * - The `cacheFeatureVector` parameter caches the FeatureVector for instances of this property. Thus, feature
+    *   extraction is performed only once during the training/testing process. This can lead to an increase in RAM
+    *   usage but will lead to speed-up in training iterations. Recommended to use with static features which have high
+    *   feature extraction effort.
+    *
+    * @param node [[Node]] instance to add the current property to.
+    * @param name Name of the property.
+    * @param cache Boolean indicating if this property sensor's value should be cached within training iterations.
+    * @param ordered Denoting if the order among the values in this property needs to be preserved. Only applies to
+    *                collection based properties.
+    * @param cacheFeatureVector Boolean indicating if this property's feature vector should be cached during
+    *                           training/testing. Caching feature vector saves redundant feature extraction during
+    *                           training/testing.
+    * @tparam T Data type of the node that this property is associated with.
+    * @return [[PropertyApply]] instance
+    */
+  class PropertyApply[T <: AnyRef] private[DataModel] (
+    val node: Node[T],
+    name: String,
+    cache: Boolean,
+    ordered: Boolean,
+    cacheFeatureVector: Boolean
+  ) {
     papply =>
 
     // TODO(danielk): make the hashmaps immutable
@@ -174,7 +201,11 @@ trait DataModel extends Logging {
 
     def apply(f: T => Boolean)(implicit tag: ClassTag[T]): BooleanProperty[T] = {
       def cachedF = if (cache) { x: T => getOrUpdate(x, f).asInstanceOf[Boolean] } else f
-      val a = new BooleanProperty[T](name, cachedF) with NodeProperty[T] { override def node: Node[T] = papply.node }
+      val a = new BooleanProperty[T](name, cachedF) with NodeProperty[T] {
+        override def node: Node[T] = papply.node
+        override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
+      }
+
       papply.node.properties += a
       properties += a
       a
@@ -186,10 +217,12 @@ trait DataModel extends Logging {
       val a = if (ordered) {
         new RealArrayProperty[T](name, newf) with NodeProperty[T] {
           override def node: Node[T] = papply.node
+          override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
         }
       } else {
         new RealGenProperty[T](name, newf) with NodeProperty[T] {
           override def node: Node[T] = papply.node
+          override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
         }
       }
       papply.node.properties += a
@@ -203,6 +236,7 @@ trait DataModel extends Logging {
       val newf: T => Double = { t => cachedF(t).toDouble }
       val a = new RealProperty[T](name, newf) with NodeProperty[T] {
         override def node: Node[T] = papply.node
+        override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
       }
       papply.node.properties += a
       properties += a
@@ -215,6 +249,7 @@ trait DataModel extends Logging {
       def cachedF = if (cache) { x: T => getOrUpdate(x, f).asInstanceOf[List[Double]] } else f
       val a = new RealCollectionProperty[T](name, cachedF, ordered) with NodeProperty[T] {
         override def node: Node[T] = papply.node
+        override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
       }
       papply.node.properties += a
       properties += a
@@ -227,6 +262,7 @@ trait DataModel extends Logging {
       def cachedF = if (cache) { x: T => getOrUpdate(x, f).asInstanceOf[Double] } else f
       val a = new RealProperty[T](name, cachedF) with NodeProperty[T] {
         override def node: Node[T] = papply.node
+        override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
       }
       papply.node.properties += a
       properties += a
@@ -239,6 +275,7 @@ trait DataModel extends Logging {
       def cachedF = if (cache) { x: T => getOrUpdate(x, f).asInstanceOf[String] } else f
       val a = new DiscreteProperty[T](name, cachedF, None) with NodeProperty[T] {
         override def node: Node[T] = papply.node
+        override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
       }
       papply.node.properties += a
       properties += a
@@ -251,6 +288,7 @@ trait DataModel extends Logging {
       def cachedF = if (cache) { x: T => getOrUpdate(x, f).asInstanceOf[List[String]] } else f
       val a = new DiscreteCollectionProperty[T](name, cachedF, !ordered) with NodeProperty[T] {
         override def node: Node[T] = papply.node
+        override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
       }
       papply.node.properties += a
       properties += a
@@ -265,15 +303,37 @@ trait DataModel extends Logging {
       val r = range.toList
       val a = new DiscreteProperty[T](name, cachedF, Some(r)) with NodeProperty[T] {
         override def node: Node[T] = papply.node
+        override val cacheFeatureVector: Boolean = papply.cacheFeatureVector
       }
       papply.node.properties += a
       properties += a
       a
     }
   }
 
-  def property[T <: AnyRef](node: Node[T], name: String = "prop" + properties.size, cache: Boolean = false, ordered: Boolean = false) =
-    new PropertyApply[T](node, name, cache, ordered)
+  /** Function to create a new [[Property]] instance inside a DataModel.
+    *
+    * Note:
+    * - The `cache` parameter is used to cache a property sensor's value within a single training iteration. This is
+    *   useful if properties are defined recursively.
+    * - The `cacheFeatureVector` parameter caches the FeatureVector for instances of this property. Thus, feature
+    *   extraction is performed only once during the training/testing process. This can lead to an increase in RAM
+    *   usage but will lead to speed-up in training iterations. Recommended to use with static features which have high
+    *   feature extraction effort.
+    *
+    * @param node [[Node]] instance to add the current property to.
+    * @param name Name of the property.
+    * @param cache Boolean indicating if this property sensor's value should be cached within training iterations.
+    * @param ordered Denoting if the order among the values in this property needs to be preserved. Only applies to
+    *                collection based properties.
+    * @param cacheFeatureVector Boolean indicating if this property's feature vector should be cached during
+    *                           training/testing. Caching feature vector saves redundant feature extraction during
+    *                           training/testing.
+    * @tparam T Data type of the node that this property is associated with.
+    * @return Property instance wrapped in a helper class [[PropertyApply]]
+    */
+  def property[T <: AnyRef](node: Node[T], name: String = "prop" + properties.size, cache: Boolean = false, ordered: Boolean = false, cacheFeatureVector: Boolean = false) =
+    new PropertyApply[T](node, name, cache, ordered, cacheFeatureVector)
 
   /** Methods for caching Data Model */
   var hasDerivedInstances = false

diff --git a/saul-core/src/main/scala/edu/illinois/cs/cogcomp/saul/datamodel/node/Node.scala b/saul-core/src/main/scala/edu/illinois/cs/cogcomp/saul/datamodel/node/Node.scala
@@ -80,11 +80,16 @@ class Node[T <: AnyRef](val keyFunc: T => Any = (x: T) => x, val tag: ClassTag[T
   }
 
   def clear(): Unit = {
+    // Clear property caches
+    propertyCacheList.foreach(_.clear())
+    propertyFeatureVectorCache.clear()
+
     collection.clear
     trainingSet.clear
     testingSet.clear
-    for (e <- incoming) e.clear
-    for (e <- outgoing) e.clear
+
+    for (e <- incoming) e.clear()
+    for (e <- outgoing) e.clear()
   }
 
   private var count: AtomicInteger = new AtomicInteger()
@@ -312,8 +317,11 @@ class Node[T <: AnyRef](val keyFunc: T => Any = (x: T) => x, val tag: ClassTag[T
     }
   }
 
+  /** WeakHashMap instance to cache property's [[FeatureVector]] instances during training/testing */
+  private[saul] final val propertyFeatureVectorCache = new mutable.WeakHashMap[T, mutable.HashMap[Property[_], FeatureVector]]()
+
   /** list of hashmaps used inside properties for caching sensor values */
-  final val propertyCacheList = new ListBuffer[MutableHashMap[_, Any]]()
+  private[saul] final val propertyCacheList = new ListBuffer[MutableHashMap[_, Any]]()
 
   def clearPropertyCache(): Unit = {
     if (propertyCacheList.nonEmpty) {

diff --git a/...main/scala/edu/illinois/cs/cogcomp/saul/datamodel/property/CombinedDiscreteProperty.scala b/...main/scala/edu/illinois/cs/cogcomp/saul/datamodel/property/CombinedDiscreteProperty.scala
@@ -6,13 +6,22 @@
   */
 package edu.illinois.cs.cogcomp.saul.datamodel.property
 
-import java.util
-
 import edu.illinois.cs.cogcomp.lbjava.classify.{ Classifier, FeatureVector }
+import edu.illinois.cs.cogcomp.saul.datamodel.node.NodeProperty
+
+import java.util
 
+import scala.collection.mutable
 import scala.reflect.ClassTag
 
-case class CombinedDiscreteProperty[T <: AnyRef](atts: List[Property[T]])(implicit val tag: ClassTag[T]) extends TypedProperty[T, List[_]] {
+/** Represents a collection of properties.
+  *
+  * @param atts List of properties (attributes).
+  * @param supportsFeatureVectorCaching Boolean to denote if feature vector caching should be supported.
+  * @param tag ClassTag of the property's input type.
+  * @tparam T Property's input type.
+  */
+case class CombinedDiscreteProperty[T <: AnyRef](atts: List[Property[T]], supportsFeatureVectorCaching: Boolean = false)(implicit val tag: ClassTag[T]) extends TypedProperty[T, List[_]] {
 
   override val sensor: (T) => List[_] = {
     t: T => atts.map(att => att.sensor(t))
@@ -26,7 +35,21 @@ case class CombinedDiscreteProperty[T <: AnyRef](atts: List[Property[T]])(implic
 
   override def featureVector(instance: T): FeatureVector = {
     val featureVector = new FeatureVector()
-    atts.foreach(property => featureVector.addFeatures(property.featureVector(instance)))
+    atts.foreach(property => {
+      val extractedFeatureVector = {
+        // Handle caching of Feature Vector
+        if (supportsFeatureVectorCaching && property.cacheFeatureVector && property.isInstanceOf[NodeProperty[T]]) {
+          val nodeProperty = property.asInstanceOf[NodeProperty[T]]
+          val instanceCacheMap = nodeProperty.node.propertyFeatureVectorCache
+            .getOrElseUpdate(instance, new mutable.HashMap[Property[_], FeatureVector]())
+          instanceCacheMap.getOrElseUpdate(property, property.featureVector(instance))
+        } else {
+          property.featureVector(instance)
+        }
+      }
+
+      featureVector.addFeatures(extractedFeatureVector)
+    })
     featureVector
   }
 

diff --git a/saul-core/src/main/scala/edu/illinois/cs/cogcomp/saul/datamodel/property/Property.scala b/saul-core/src/main/scala/edu/illinois/cs/cogcomp/saul/datamodel/property/Property.scala
@@ -28,6 +28,8 @@ trait Property[T] {
 
   val sensor: T => S
 
+  val cacheFeatureVector: Boolean = false
+
   def apply(instance: T): S = sensor(instance)
 
   def featureVector(instance: T): FeatureVector

diff --git a/saul-core/src/test/scala/edu/illinois/cs/cogcomp/saul/datamodel/propertyTest.scala b/saul-core/src/test/scala/edu/illinois/cs/cogcomp/saul/datamodel/propertyTest.scala
@@ -6,6 +6,8 @@
   */
 package edu.illinois.cs.cogcomp.saul.datamodel
 
+import edu.illinois.cs.cogcomp.lbjava.learn.{ SparseNetworkLearner, SparsePerceptron }
+import edu.illinois.cs.cogcomp.saul.classifier.Learnable
 import edu.illinois.cs.cogcomp.saul.datamodel.property.PairwiseConjunction
 import org.scalatest._
 
@@ -56,6 +58,55 @@ class propertyTest extends FlatSpec with Matchers {
       Set(p1.name, p2.name, p3.name).size should be(3)
     }
   }
+
+  "property feature vector caching" should "work" in {
+    var counterNonStatic: Int = 0
+    var counterStatic: Int = 0
+
+    object testModel extends DataModel {
+      val n = node[String]
+
+      val testLabel = property(n) { s: String => s }
+      val nonStaticProperty = property(n) { s: String => counterNonStatic += 1; s }
+      val staticProperty = property(n, cacheFeatureVector = true) { s: String => counterStatic += 1; s }
+    }
+
+    import testModel._
+
+    object testClassifier extends Learnable[String](n) {
+      def label = testLabel
+      override lazy val classifier = new SparseNetworkLearner()
+      override def feature = using(staticProperty, nonStaticProperty)
+    }
+
+    val dataset = List("test", "testSecond")
+
+    n.populate(dataset)
+    testClassifier.learn(5)
+
+    counterNonStatic should be(10) // 5 iterations * 2 items
+    counterStatic should be(2) // 2 items
+
+    // To indicate that sensor values are not cached
+    nonStaticProperty("test")
+    staticProperty("test")
+
+    counterNonStatic should be(11)
+    counterStatic should be(3)
+
+    // To indicate that feature vectors are only cached in the training workflow
+    // Accessing featureVector directly does not return cached value.
+    nonStaticProperty.featureVector("test")
+    staticProperty.featureVector("test")
+
+    counterNonStatic should be(12)
+    counterStatic should be(4)
+
+    testClassifier.learn(5)
+
+    counterNonStatic should be(22)
+    counterStatic should be(4)
+  }
 }
 
 object toyDataModel extends DataModel {