Slide 67
Slide 67 text
What can be distributed?
# Iterative gradient-descent loop with an early stop on loss change.
# Slide pseudocode, not runnable as-is: `Double.Inf` and
# `for i = 0 .. maxIterations` are not Python syntax.
#
#   X, Y      passed unchanged to GradLoss and Loss
#             (presumably training inputs and targets -- TODO confirm)
#   Loss      called as Loss(Model(W), X, Y); its value is compared between iterations
#   GradLoss  called as GradLoss(W, X, Y); its value, scaled by s, is subtracted from W
#   W0        starting value of W
#   s         multiplier applied to the gradient (step size)
#
# Returns Model(W) built from the last W computed.
#
# NOTE(review): maxIterations, eps and Model are neither parameters nor defined
# in this snippet; they are assumed to come from the surrounding context.
def SGD(X, Y, Loss, GradLoss, W0, s):
    W = W0
    # Start from infinity so that, for a finite loss, the first difference exceeds eps.
    lastLoss = Double.Inf
    # NOTE(review): the snippet does not say whether `0 .. maxIterations` includes the upper bound.
    for i = 0 .. maxIterations:
        # Every step passes the whole of X and Y to GradLoss.
        W = W - s * GradLoss(W, X, Y)
        currentLoss = Loss(Model(W), X, Y)
        if abs(currentLoss - lastLoss) > eps:
            lastLoss = currentLoss
        else:
            # Loss moved by at most eps since the previous iteration: stop early.
            break
    return Model(W)