Professional Documents
Culture Documents
# Moving average of the gradients. Inputs: "v, grads, beta1". Output: "v".
# (approx. 2 lines)
# v["dW" + str(l)] = ...
# v["db" + str(l)] = ...
# YOUR CODE STARTS HERE
v['dW' + str(l)] = beta1 * v['dW' + str(l)] + (1 - beta1) * grads['dW' +
str(l)]
v['db' + str(l)] = beta1 * v['dw' + str(l)] + (1 - beta1) * grads['db' +
str(l)]
# YOUR CODE ENDS HERE
# Compute bias-corrected second raw moment estimate. Inputs: "s, beta2, t".
Output: "s_corrected".
# (approx. 2 lines)
# s_corrected["dW" + str(l)] = ...
# s_corrected["db" + str(l)] = ...
# YOUR CODE STARTS HERE
s_corrected['dW' + str(l)] = s['dW' + str(l)]/(1 - np.power(beta2,t))
s_corrected['db' + str(l)] = s['db' + str(l)]/(1 - np.power(beta2,t))
# YOUR CODE ENDS HERE