Comment

PavelCz · PavelCz · commit a2bc763d19d3 · 2022-12-09T21:16:18.000+01:00
diff --git a/src/reward_preprocessing/vis/reward_vis.py b/src/reward_preprocessing/vis/reward_vis.py
@@ -263,14 +263,21 @@ def vis_traditional(
             feature_list = [feature_list]
 
         obj = sum(
-            # Original with cosine similarity:
+            # Original with cosine similarity (for if we go back to interpreting neuron
+            # directions in intermediate layers_:
             # [
             #     objectives_rfi.direction_neuron_dim_agnostic(
             #         self.layer_name, self.channel_dirs[feature], batch=feature
             #     )
             #     for feature in feature_list
             # ]
             # New:
+            # Sum up all objectives such that we simultaneously optimize for all.
+            # Each objective maximizes the output for one of the activations (in this
+            # case equivalent to the reward for the respective actions, or overall
+            # reward if we don't differentiate between actions) and depends only on the
+            # input at that same index.
+            # In other words, each input maximizes its respective activation.
             [
                 objectives_rfi.max_index_1d(self.layer_name, feature, batch=feature)
                 for feature in feature_list