Skip to content

Commit 0468a8d

Browse files
Jonathan Shen and copybara-github
authored and committed
Default to wrapping optimizer.Apply in learner variable_scope.
optimizer.Apply can create variables. The variables created by different optimizers can conflict with the same name in eager mode (there is no variable name auto-uniquification in eager mode). Thus manually wrapping them in a variable scope is necessary. Also delete an unused function. PiperOrigin-RevId: 415344496
1 parent 9ddf63a commit 0468a8d

File tree

1 file changed

+4
-21
lines changed

1 file changed

+4
-21
lines changed

lingvo/core/learner.py

Lines changed: 4 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -224,30 +224,13 @@ def Apply(self, metrics, vmap, gradient_mask=None, gradient_adjuster=None):
224224
else:
225225
lr_or_callable = lr
226226

227-
var_update_op = tf.group(
228-
[tpu_emb_update_op,
229-
self.optimizer.Apply(lr_or_callable, var_grads)])
227+
with self._SelfVariableScope():
228+
var_update_op = tf.group(
229+
[tpu_emb_update_op,
230+
self.optimizer.Apply(lr_or_callable, var_grads)])
230231

231232
return losses, var_update_op, eval_metrics
232233

233-
def ComputeActivationGradients(self, activations, activations_grad, vmap):
234-
p = self.params
235-
vmap = self.GetTrainableVariables(vmap)
236-
237-
for v in vmap.Flatten():
238-
tf.logging.info('%s: bprop variable: %s', p.name, v.name)
239-
return self.optimizer.ComputeGradients(
240-
activations,
241-
vmap,
242-
p.grad_aggregation_method,
243-
p.colocate_gradients_with_ops,
244-
p.gate_gradients,
245-
compute_gradients_fn=self._CustomComputeGradientsFn(),
246-
skip_zero_gradients=p.skip_zero_gradients,
247-
skip_none_gradients=False,
248-
activations_grad=activations_grad,
249-
is_activations=True)
250-
251234
def ComputeLosses(self, metrics):
252235
p = self.params
253236

0 commit comments

Comments (0)