Add support for non-scalar datasets.
khatchad committed Jan 5, 2024
1 parent f694adb commit e9e3f57
Showing 4 changed files with 199 additions and 34 deletions.
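
For context, "non-scalar" here presumably means a tf.data.Dataset whose elements are tuples, e.g. (features, label) pairs, rather than single tensors. A minimal sketch of the distinction (illustrative names, not part of the commit):

import tensorflow as tf

# Scalar elements: each iteration step yields a single tensor.
scalar_ds = tf.data.Dataset.from_tensor_slices([1.0, 2.0, 3.0])
for x in scalar_ds:
    print(x)  # x is one tf.Tensor

# Non-scalar elements: each iteration step yields an (images, labels)
# tuple, which Python destructures into two tensors.
pair_ds = tf.data.Dataset.from_tensor_slices(([1.0, 2.0], [7, 8]))
for images, labels in pair_ds:
    print(images, labels)  # two tf.Tensors per element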
@@ -209,6 +209,7 @@ public void testTf2()
testTf2("tf2_test_dataset5.py", "add", 2, 2, 2, 3);
testTf2("tf2_test_dataset6.py", "add", 2, 2, 2, 3);
testTf2("tf2_test_dataset7.py", "add", 2, 2, 2, 3);
testTf2("tf2_test_dataset8.py", "add", 2, 2, 2, 3);
testTf2("tf2_test_tensor_list.py", "add", 2, 3, 2, 3);
testTf2("tf2_test_tensor_list2.py", "add", 0, 2);
testTf2("tf2_test_tensor_list3.py", "add", 0, 2);
@@ -222,6 +223,7 @@ public void testTf2()
testTf2("tf2_test_callbacks2.py", "replica_fn", 1, 4, 2);
testTf2("tensorflow_gan_tutorial.py", "train_step", 1, 10, 2);
testTf2("tensorflow_gan_tutorial2.py", "train_step", 1, 10, 2);
testTf2("tensorflow_eager_execution.py", "MyModel.call", 1, 5, 3);
}

private void testTf2(
@@ -125,47 +125,76 @@ private static Set<PointsToSetVariable> getDataflowSources(
// the individual elements themselves as sources instead.
if (!definitionIsNonScalar(eachElementGetInstruction, du)) {
// Find the potential tensor iterable definition.
int use = eachElementGetInstruction.getUse(0);
SSAInstruction def = du.getDef(use);

if (def == null) {
logger.info(
() ->
"Can't find potential tensor iterable definition for use: "
+ use
+ " of instruction: "
+ eachElementGetInstruction
+ ". Trying interprocedural analysis...");

// Look up the use in the pointer analysis to see if it points to a dataset.
PointerKey usePointerKey =
pointerAnalysis.getHeapModel().getPointerKeyForLocal(localPointerKeyNode, use);

for (InstanceKey ik : pointerAnalysis.getPointsToSet(usePointerKey)) {
if (ik instanceof AllocationSiteInNode) {
AllocationSiteInNode asin = (AllocationSiteInNode) ik;
IClass concreteType = asin.getConcreteType();
TypeReference reference = concreteType.getReference();

if (reference.equals(DATASET)) {
sources.add(src);
logger.info("Added dataflow source from tensor dataset: " + src + ".");
break;
}
}
}
} else if (definesTensorIterable(
def, localPointerKeyNode, callGraph, pointerAnalysis)) {
sources.add(src);
logger.info("Added dataflow source from tensor iterable: " + src + ".");
}
processInstruction(
eachElementGetInstruction,
du,
localPointerKeyNode,
src,
sources,
callGraph,
pointerAnalysis);
}
} else if (inst instanceof PythonPropertyRead) {
// We are potentially pulling a tensor out of a non-scalar tensor iterable.
PythonPropertyRead propertyRead = (PythonPropertyRead) inst;

// Find the potential tensor iterable definition.
int objectRef = propertyRead.getObjectRef();
SSAInstruction def = du.getDef(objectRef);

if (def instanceof EachElementGetInstruction || def instanceof PythonPropertyRead) {
processInstruction(
def, du, localPointerKeyNode, src, sources, callGraph, pointerAnalysis);
}
}
}
}
return sources;
}

private static void processInstruction(
SSAInstruction instruction,
DefUse du,
CGNode localPointerKeyNode,
PointsToSetVariable src,
Set<PointsToSetVariable> sources,
CallGraph callGraph,
PointerAnalysis<InstanceKey> pointerAnalysis) {
int use = instruction.getUse(0);
SSAInstruction def = du.getDef(use);

if (def == null) {
logger.info(
() ->
"Can't find potential tensor iterable definition for use: "
+ use
+ " of instruction: "
+ instruction
+ ". Trying interprocedural analysis...");

// Look up the use in the pointer analysis to see if it points to a dataset.
PointerKey usePointerKey =
pointerAnalysis.getHeapModel().getPointerKeyForLocal(localPointerKeyNode, use);

for (InstanceKey ik : pointerAnalysis.getPointsToSet(usePointerKey)) {
if (ik instanceof AllocationSiteInNode) {
AllocationSiteInNode asin = (AllocationSiteInNode) ik;
IClass concreteType = asin.getConcreteType();
TypeReference reference = concreteType.getReference();

if (reference.equals(DATASET)) {
sources.add(src);
logger.info("Added dataflow source from tensor dataset: " + src + ".");
break;
}
}
}
} else if (definesTensorIterable(def, localPointerKeyNode, callGraph, pointerAnalysis)) {
sources.add(src);
logger.info("Added dataflow source from tensor iterable: " + src + ".");
}
}

/**
* True iff the given {@link EachElementGetInstruction} constitutes individual elements.
*
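
At the source level, the new PythonPropertyRead branch and the recursive processInstruction call plausibly correspond to tuple destructuring during dataset iteration. A hypothetical sketch, with the assumed IR lowering in comments (the lowering shown is an assumption, not taken from the commit):

import tensorflow as tf

xs = [[0.0], [1.0]]  # placeholder features
ys = [0, 1]          # placeholder labels
dataset = tf.data.Dataset.from_tensor_slices((xs, ys))

# Assumed lowering of the destructuring loop below:
#   v2 = each-element-get(v1)   # EachElementGetInstruction over the dataset v1
#   v3 = v2[0]                  # PythonPropertyRead whose objectRef (v2) is
#   v4 = v2[1]                  # defined by the EachElementGetInstruction
# processInstruction() chases v3/v4 back through v2 to v1, then asks the
# pointer analysis whether v1's allocation site has the DATASET type.
for images, labels in dataset:
    pass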
122 changes: 122 additions & 0 deletions com.ibm.wala.cast.python.test/data/tensorflow_eager_execution.py
@@ -0,0 +1,122 @@
#!/usr/bin/env python

import sys
import numpy as np
import tensorflow as tf
import tensorflow.keras as keras


class MyModel(keras.Model):

def __init__(self):
super(MyModel, self).__init__()
self.conv1 = keras.layers.Conv2D(32, 3, activation="relu")
self.flatten = keras.layers.Flatten()
self.d1 = keras.layers.Dense(128, activation="relu")
self.d2 = keras.layers.Dense(10, activation="softmax")

def call(self, x):
x = self.conv1(x)
x = self.flatten(x)
x = self.d1(x)
x = self.d2(x)
return x


@tf.function
def train_step(model, fn_loss, fn_accuracy, images, labels):
with tf.GradientTape() as tape:
predictions = model(images)
loss = loss_object(labels, predictions)
gradients = tape.gradient(loss, model.trainable_variables)
optimizer.apply_gradients(zip(gradients, model.trainable_variables))

fn_loss(loss)
fn_accuracy(labels, predictions)


@tf.function
def test_step(model, fn_loss, fn_accuracy, images, labels):
predictions = model(images)
t_loss = loss_object(labels, predictions)

fn_loss(t_loss)
fn_accuracy(labels, predictions)


#
# Prepare training data
#
validation_split = 0.2

(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()

x_train = x_train.astype(np.float32) / 255.0
x_test = x_test.astype(np.float32) / 255.0

num_train = int(x_train.shape[0] * (1.0 - validation_split))
x_valid = x_train[num_train:, ..., tf.newaxis]
y_valid = y_train[num_train:]
x_train = x_train[:num_train, ..., tf.newaxis]
y_train = y_train[:num_train]

x_test = x_test[..., tf.newaxis]

train_ds = tf.data.Dataset.from_tensor_slices((x_train, y_train)).shuffle(10000).batch(32)
valid_ds = tf.data.Dataset.from_tensor_slices((x_valid, y_valid)).batch(32)
test_ds = tf.data.Dataset.from_tensor_slices((x_test, y_test)).batch(32)

#
# Model and loss functions
#
model = MyModel()

loss_object = tf.keras.losses.SparseCategoricalCrossentropy()
optimizer = tf.keras.optimizers.Adam()

train_loss = tf.keras.metrics.Mean(name="train_loss")
train_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name="train_accuracy")

valid_loss = tf.keras.metrics.Mean(name="validation_loss")
valid_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name="validation_accuracy")

test_loss = tf.keras.metrics.Mean(name="test_loss")
test_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name="test_accuracy")

#
# Run training
#
EPOCHS = 10

min_loss = sys.float_info.max
for epoch in range(EPOCHS):
for images, labels in train_ds:
train_step(model, train_loss, train_accuracy, images, labels)

for valid_images, valid_labels in valid_ds:
test_step(model, valid_loss, valid_accuracy, valid_images, valid_labels)

if valid_loss.result() < min_loss:
min_loss = valid_loss.result()
min_weights = model.get_weights()

template = "Epoch {}, Loss: {:.4f}, Acc: {:.4f}, Val Loss: {:.4f}, Val Acc: {:.4f}, Min Loss: {:.4f}"
print(template.format(epoch + 1,
train_loss.result(),
train_accuracy.result() * 100,
valid_loss.result(),
valid_accuracy.result() * 100,
min_loss))

train_loss.reset_states()
train_accuracy.reset_states()
valid_loss.reset_states()
valid_accuracy.reset_states()

model.set_weights(min_weights)

for test_images, test_labels in test_ds:
test_step(model, test_loss, test_accuracy, test_images, test_labels)

print("Test Loss: {:.4f}, Test Accuracy: {:.4f}".format(test_loss.result(), test_accuracy.result()))
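
A plausible reading of this test input: images comes from train_ds, a dataset of (images, labels) tuples, and flows through train_step into model(images), i.e. into MyModel.call; the new testTf2("tensorflow_eager_execution.py", "MyModel.call", 1, 5, 3) expectation above presumably checks that the analysis tracks tensors along that path.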

12 changes: 12 additions & 0 deletions com.ibm.wala.cast.python.test/data/tf2_test_dataset8.py
@@ -0,0 +1,12 @@
import tensorflow as tf


def add(a, b):
return a + b


(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()
dataset = tf.data.Dataset.from_tensor_slices((x_train, y_train)).shuffle(10000).batch(32)

for images, labels in dataset:
c = add(images, labels)
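
Each element of dataset here is an (images, labels) pair, so both arguments of add are tensors destructured from a non-scalar dataset; this appears to be what the new testTf2("tf2_test_dataset8.py", "add", 2, 2, 2, 3) expectation above exercises.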
