import tensorflow as tf
from delay_loss_scale import DenseLossScaleOptimizer, SparseLossScaleOptimizer
from mx_rec.util.initialize import ConfigInitializer
from mx_rec.optimizers.gradient_descent_by_addr import create_hash_optimizer_by_addr
from mx_rec.optimizers.gradient_descent import create_hash_optimizer
from mx_rec.optimizers import lazy_adam
def get_dense_and_sparse_optimizer(cfg):
use_dynamic_expansion = ConfigInitializer.get_instance().use_dynamic_expansion
if cfg.use_lazy_adam_optimizer:
if use_dynamic_expansion:
raise RuntimeError("model is incompatible with dynamic_expansion when use lazy_adam optimizer.")
dense_optimizer = tf.compat.v1.train.AdamOptimizer(learning_rate=cfg.learning_rate[0])
sparse_optimizer = lazy_adam.create_hash_optimizer(learning_rate=cfg.learning_rate[1])
loss_scale = 65536
else:
dense_optimizer = tf.compat.v1.train.GradientDescentOptimizer(learning_rate=cfg.learning_rate[0])
if use_dynamic_expansion:
sparse_optimizer = create_hash_optimizer_by_addr(learning_rate=cfg.learning_rate[1], weight_decay=0.0001)
else:
sparse_optimizer = create_hash_optimizer(
learning_rate=cfg.learning_rate[1], weight_decay=0.0001, use_fusion_optim=cfg.use_fusion_optim)
loss_scale = 1024
sparse_optimizer = SparseLossScaleOptimizer(sparse_optimizer, loss_scale)
dense_optimizer = DenseLossScaleOptimizer(dense_optimizer, loss_scale)
return dense_optimizer, sparse_optimizer