Optimization, Minimization & Fitting Notes & Recipes#
import numpy as np
from scipy import optimize
import matplotlib.pyplot as plt
np.random.seed(371)
def g(x,mu,sigma):
    return -np.exp(-(x-mu)**2/(2*sigma**2))
x = np.linspace(0,15,100)
mu = 5
sigma = 1
plt.plot(x,g(x,mu,sigma))
plt.show()

optimize.minimize(g,x0=2,args=(mu,sigma))
fun: -1.0
hess_inv: array([[1.00023666]])
jac: array([0.])
message: 'Optimization terminated successfully.'
nfev: 24
nit: 3
njev: 12
status: 0
success: True
x: array([5.])
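Note that the result can depend strongly on the starting point: far away from \(\mu\) the negative Gaussian is essentially flat, so a gradient-based minimizer has almost nothing to follow. A minimal check, where the starting value x0=12 is an arbitrary illustrative choice:

# Far from mu the gradient of g is practically zero, so the optimizer is
# likely to report success near the starting point instead of reaching
# the true minimum at x = mu.
optimize.minimize(g,x0=12,args=(mu,sigma))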
Gradient Descent Algorithm#
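The recipe implemented below is the basic update rule: starting from some \(x_0\), repeatedly step against the derivative,

\(x_{n+1} = x_n - \eta\,f'(x_n)\)

where \(\eta\) is the step size (learning rate), and stop once \(|f'(x_n)|\) falls below a chosen tolerance.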
Parabola#
def f(x,abc):
    return abc[0]*x**2+abc[1]*x+abc[2]
def g(x,abc):
    # Derivative
    return 2*abc[0]*x+abc[1]
xx = np.linspace(-5,10,100)
abc = np.array([2,3,-4])
plt.plot(xx,f(xx,abc))
plt.show()

x = 5
N = 50
eta = .4
tolerance = 1E-4
xs_so_far = [x]
fs_so_far = [f(x,abc)]
for i in range(N):
    gg = g(x,abc)
    print("Step #{:d}".format(i+1))
    print("The derivative (gradient) at x = {:7.5f} is {:5.3f}"\
          .format(x,gg))
    if(np.abs(gg)<tolerance):
        print("\tAs it is sufficiently close to zero, we have found the minima!")
        break
    elif(gg>0):
        print("\tAs it is positive, go left by: "+
              "(this amount)*eta(={:.2f}).".format(eta))
    else:
        print("\tAs it is negative, go right by: "+
              "|this amount|*eta(={:.2f}).".format(eta))
    delta = -gg*eta
    x0 = x
    x = x + delta
    xs_so_far.append(x)
    fs_so_far.append(f(x,abc))
    print("\t==> The new x is {:7.5f}{:+7.5f}={:7.5f}".format(x0,delta,x))
    plt.plot(xx,f(xx,abc),color="orange")
    plt.plot(xs_so_far,fs_so_far,"*-")
    plt.show()
    print("-"*45)
Step #1
The derivative (gradient) at x = 5.00000 is 23.000
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00000-9.20000=-4.20000

---------------------------------------------
Step #2
The derivative (gradient) at x = -4.20000 is -13.800
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -4.20000+5.52000=1.32000

---------------------------------------------
Step #3
The derivative (gradient) at x = 1.32000 is 8.280
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 1.32000-3.31200=-1.99200

---------------------------------------------
Step #4
The derivative (gradient) at x = -1.99200 is -4.968
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -1.99200+1.98720=-0.00480

---------------------------------------------
Step #5
The derivative (gradient) at x = -0.00480 is 2.981
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.00480-1.19232=-1.19712

---------------------------------------------
Step #6
The derivative (gradient) at x = -1.19712 is -1.788
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -1.19712+0.71539=-0.48173

---------------------------------------------
Step #7
The derivative (gradient) at x = -0.48173 is 1.073
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.48173-0.42924=-0.91096

---------------------------------------------
Step #8
The derivative (gradient) at x = -0.91096 is -0.644
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.91096+0.25754=-0.65342

---------------------------------------------
Step #9
The derivative (gradient) at x = -0.65342 is 0.386
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.65342-0.15452=-0.80795

---------------------------------------------
Step #10
The derivative (gradient) at x = -0.80795 is -0.232
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.80795+0.09271=-0.71523

---------------------------------------------
Step #11
The derivative (gradient) at x = -0.71523 is 0.139
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.71523-0.05563=-0.77086

---------------------------------------------
Step #12
The derivative (gradient) at x = -0.77086 is -0.083
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.77086+0.03338=-0.73748

---------------------------------------------
Step #13
The derivative (gradient) at x = -0.73748 is 0.050
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.73748-0.02003=-0.75751

---------------------------------------------
Step #14
The derivative (gradient) at x = -0.75751 is -0.030
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.75751+0.01202=-0.74549

---------------------------------------------
Step #15
The derivative (gradient) at x = -0.74549 is 0.018
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.74549-0.00721=-0.75270

---------------------------------------------
Step #16
The derivative (gradient) at x = -0.75270 is -0.011
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.75270+0.00433=-0.74838

---------------------------------------------
Step #17
The derivative (gradient) at x = -0.74838 is 0.006
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.74838-0.00260=-0.75097

---------------------------------------------
Step #18
The derivative (gradient) at x = -0.75097 is -0.004
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.75097+0.00156=-0.74942

---------------------------------------------
Step #19
The derivative (gradient) at x = -0.74942 is 0.002
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.74942-0.00093=-0.75035

---------------------------------------------
Step #20
The derivative (gradient) at x = -0.75035 is -0.001
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.75035+0.00056=-0.74979

---------------------------------------------
Step #21
The derivative (gradient) at x = -0.74979 is 0.001
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.74979-0.00034=-0.75013

---------------------------------------------
Step #22
The derivative (gradient) at x = -0.75013 is -0.001
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.75013+0.00020=-0.74992

---------------------------------------------
Step #23
The derivative (gradient) at x = -0.74992 is 0.000
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.74992-0.00012=-0.75005

---------------------------------------------
Step #24
The derivative (gradient) at x = -0.75005 is -0.000
As it is negative, go right by: |this amount|*eta(=0.40).
==> The new x is -0.75005+0.00007=-0.74997

---------------------------------------------
Step #25
The derivative (gradient) at x = -0.74997 is 0.000
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is -0.74997-0.00004=-0.75002

---------------------------------------------
Step #26
The derivative (gradient) at x = -0.75002 is -0.000
As it is sufficiently close to zero, we have found the minima!
# Real minimum:
np.roots([2*abc[0],abc[1]]) # root of 2ax + b
array([-0.75])
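This agrees with the analytic vertex of \(f(x)=ax^2+bx+c\), \(x_\mathrm{min} = -\dfrac{b}{2a} = -\dfrac{3}{2\cdot 2} = -0.75\). The oscillating approach seen in the steps above also follows directly: for a parabola the update \(x_{n+1}=x_n-\eta\,(2ax_n+b)\) shrinks the distance to the minimum by a constant factor,

\(x_{n+1}-x_\mathrm{min} = (1-2a\eta)\,(x_n-x_\mathrm{min}) = -0.6\,(x_n-x_\mathrm{min}),\)

so with \(\eta=0.4\) each step overshoots to the other side while reducing the distance by 40%; any \(\eta>1/a=0.5\) would have diverged.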
“Negative” Gaussian#
def f(x,mu,sigma):
    return -np.exp(-(x-mu)**2/(2*sigma**2))
def g(x,mu,sigma):
    # Derivative with respect to x
    return (x-mu)/(sigma**2)*np.exp(-(x-mu)**2/(2*sigma**2))
mu = 5
sigma = 1
xx = np.linspace(0,15,100)
plt.plot(xx,f(xx,mu,sigma))
plt.show()

x = 8
N = 60
eta = .4
tolerance = 1E-4
xs_so_far = [x]
fs_so_far = [f(x,mu,sigma)]
for i in range(N):
    gg = g(x,mu,sigma)
    print("Step #{:d}".format(i+1))
    print("The derivative (gradient) at x = {:7.5f} is {:5.4f}"\
          .format(x,gg))
    if(np.abs(gg)<tolerance):
        print("\tAs it is sufficiently close to zero, we have found the minima!")
        break
    elif(gg>0):
        print("\tAs it is positive, go left by: "+
              "(this amount)*eta(={:.2f}).".format(eta))
    else:
        print("\tAs it is negative, go right by: "+
              "|this amount|*eta(={:.2f}).".format(eta))
    delta = -gg*eta
    x0 = x
    x = x + delta
    xs_so_far.append(x)
    fs_so_far.append(f(x,mu,sigma))
    print("\t==> The new x is {:7.5f}{:+7.5f}={:7.5f}".format(x0,delta,x))
    plt.plot(xx,f(xx,mu,sigma),color="orange")
    plt.plot(xs_so_far,fs_so_far,"*-")
    plt.show()
    print("-"*45)
Step #1
The derivative (gradient) at x = 8.00000 is 0.0333
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 8.00000-0.01333=7.98667

---------------------------------------------
Step #2
The derivative (gradient) at x = 7.98667 is 0.0345
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.98667-0.01381=7.97286

---------------------------------------------
Step #3
The derivative (gradient) at x = 7.97286 is 0.0358
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.97286-0.01433=7.95853

---------------------------------------------
Step #4
The derivative (gradient) at x = 7.95853 is 0.0372
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.95853-0.01488=7.94366

---------------------------------------------
Step #5
The derivative (gradient) at x = 7.94366 is 0.0387
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.94366-0.01546=7.92819

---------------------------------------------
Step #6
The derivative (gradient) at x = 7.92819 is 0.0402
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.92819-0.01610=7.91209

---------------------------------------------
Step #7
The derivative (gradient) at x = 7.91209 is 0.0420
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.91209-0.01678=7.89531

---------------------------------------------
Step #8
The derivative (gradient) at x = 7.89531 is 0.0438
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.89531-0.01752=7.87780

---------------------------------------------
Step #9
The derivative (gradient) at x = 7.87780 is 0.0458
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.87780-0.01831=7.85948

---------------------------------------------
Step #10
The derivative (gradient) at x = 7.85948 is 0.0479
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.85948-0.01918=7.84031

---------------------------------------------
Step #11
The derivative (gradient) at x = 7.84031 is 0.0503
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.84031-0.02012=7.82019

---------------------------------------------
Step #12
The derivative (gradient) at x = 7.82019 is 0.0529
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.82019-0.02115=7.79904

---------------------------------------------
Step #13
The derivative (gradient) at x = 7.79904 is 0.0557
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.79904-0.02227=7.77676

---------------------------------------------
Step #14
The derivative (gradient) at x = 7.77676 is 0.0588
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.77676-0.02351=7.75325

---------------------------------------------
Step #15
The derivative (gradient) at x = 7.75325 is 0.0622
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.75325-0.02488=7.72837

---------------------------------------------
Step #16
The derivative (gradient) at x = 7.72837 is 0.0660
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.72837-0.02639=7.70198

---------------------------------------------
Step #17
The derivative (gradient) at x = 7.70198 is 0.0702
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.70198-0.02808=7.67389

---------------------------------------------
Step #18
The derivative (gradient) at x = 7.67389 is 0.0749
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.67389-0.02997=7.64393

---------------------------------------------
Step #19
The derivative (gradient) at x = 7.64393 is 0.0802
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.64393-0.03209=7.61184

---------------------------------------------
Step #20
The derivative (gradient) at x = 7.61184 is 0.0862
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.61184-0.03449=7.57735

---------------------------------------------
Step #21
The derivative (gradient) at x = 7.57735 is 0.0931
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.57735-0.03722=7.54012

---------------------------------------------
Step #22
The derivative (gradient) at x = 7.54012 is 0.1009
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.54012-0.04035=7.49978

---------------------------------------------
Step #23
The derivative (gradient) at x = 7.49978 is 0.1099
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.49978-0.04396=7.45582

---------------------------------------------
Step #24
The derivative (gradient) at x = 7.45582 is 0.1204
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.45582-0.04815=7.40766

---------------------------------------------
Step #25
The derivative (gradient) at x = 7.40766 is 0.1327
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.40766-0.05307=7.35459

---------------------------------------------
Step #26
The derivative (gradient) at x = 7.35459 is 0.1472
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.35459-0.05890=7.29569

---------------------------------------------
Step #27
The derivative (gradient) at x = 7.29569 is 0.1646
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.29569-0.06585=7.22984

---------------------------------------------
Step #28
The derivative (gradient) at x = 7.22984 is 0.1856
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.22984-0.07424=7.15560

---------------------------------------------
Step #29
The derivative (gradient) at x = 7.15560 is 0.2111
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.15560-0.08446=7.07115

---------------------------------------------
Step #30
The derivative (gradient) at x = 7.07115 is 0.2425
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 7.07115-0.09700=6.97414

---------------------------------------------
Step #31
The derivative (gradient) at x = 6.97414 is 0.2813
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 6.97414-0.11250=6.86164

---------------------------------------------
Step #32
The derivative (gradient) at x = 6.86164 is 0.3291
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 6.86164-0.13164=6.73000

---------------------------------------------
Step #33
The derivative (gradient) at x = 6.73000 is 0.3874
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 6.73000-0.15495=6.57505

---------------------------------------------
Step #34
The derivative (gradient) at x = 6.57505 is 0.4556
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 6.57505-0.18225=6.39280

---------------------------------------------
Step #35
The derivative (gradient) at x = 6.39280 is 0.5280
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 6.39280-0.21121=6.18159

---------------------------------------------
Step #36
The derivative (gradient) at x = 6.18159 is 0.5879
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 6.18159-0.23516=5.94644

---------------------------------------------
Step #37
The derivative (gradient) at x = 5.94644 is 0.6048
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.94644-0.24190=5.70453

---------------------------------------------
Step #38
The derivative (gradient) at x = 5.70453 is 0.5497
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.70453-0.21988=5.48466

---------------------------------------------
Step #39
The derivative (gradient) at x = 5.48466 is 0.4310
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.48466-0.17238=5.31228

---------------------------------------------
Step #40
The derivative (gradient) at x = 5.31228 is 0.2974
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.31228-0.11897=5.19331

---------------------------------------------
Step #41
The derivative (gradient) at x = 5.19331 is 0.1897
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.19331-0.07589=5.11742

---------------------------------------------
Step #42
The derivative (gradient) at x = 5.11742 is 0.1166
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.11742-0.04664=5.07077

---------------------------------------------
Step #43
The derivative (gradient) at x = 5.07077 is 0.0706
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.07077-0.02824=5.04253

---------------------------------------------
Step #44
The derivative (gradient) at x = 5.04253 is 0.0425
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.04253-0.01700=5.02554

---------------------------------------------
Step #45
The derivative (gradient) at x = 5.02554 is 0.0255
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.02554-0.01021=5.01533

---------------------------------------------
Step #46
The derivative (gradient) at x = 5.01533 is 0.0153
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.01533-0.00613=5.00920

---------------------------------------------
Step #47
The derivative (gradient) at x = 5.00920 is 0.0092
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00920-0.00368=5.00552

---------------------------------------------
Step #48
The derivative (gradient) at x = 5.00552 is 0.0055
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00552-0.00221=5.00331

---------------------------------------------
Step #49
The derivative (gradient) at x = 5.00331 is 0.0033
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00331-0.00132=5.00199

---------------------------------------------
Step #50
The derivative (gradient) at x = 5.00199 is 0.0020
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00199-0.00079=5.00119

---------------------------------------------
Step #51
The derivative (gradient) at x = 5.00119 is 0.0012
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00119-0.00048=5.00072

---------------------------------------------
Step #52
The derivative (gradient) at x = 5.00072 is 0.0007
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00072-0.00029=5.00043

---------------------------------------------
Step #53
The derivative (gradient) at x = 5.00043 is 0.0004
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00043-0.00017=5.00026

---------------------------------------------
Step #54
The derivative (gradient) at x = 5.00026 is 0.0003
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00026-0.00010=5.00015

---------------------------------------------
Step #55
The derivative (gradient) at x = 5.00015 is 0.0002
As it is positive, go left by: (this amount)*eta(=0.40).
==> The new x is 5.00015-0.00006=5.00009

---------------------------------------------
Step #56
The derivative (gradient) at x = 5.00009 is 0.0001
As it is sufficiently close to zero, we have found the minima!
Fitting parameters via the gradient descent algorithm#
mu = 5
sigma = 1
N = 10
x = np.random.rand(N)*4+3
t = f(x,mu,sigma)
xx = np.linspace(3,7,100)
plt.plot(xx,f(xx,mu,sigma),color="orange")
plt.plot(x,t,"o")
plt.show()

\(\newcommand{\diff}{\text{d}} \newcommand{\dydx}[2]{\frac{\text{d}#1}{\text{d}#2}} \newcommand{\ddydx}[2]{\frac{\text{d}^2#1}{\text{d}#2^2}} \newcommand{\pypx}[2]{\frac{\partial#1}{\partial#2}} \newcommand{\unit}[1]{\,\text{#1}}\)
We have the data points and we know the form of the function, but we don't have \(\mu\) & \(\sigma\).
The function we are going to try to minimize will be the difference between the real values (\(\{t_i\}\)) corresponding to \(\{x_i\}\) and the projected values (\(\{y_i\}\)):

\(E_i(\mu,\sigma) = t_i - y_i = t_i + e^{-(x_i-\mu)^2/(2\sigma^2)},\qquad y_i = f(x_i;\mu,\sigma)\)
Begin by calculating the derivatives:

\(\pypx{E_i}{\mu} = \frac{x_i-\mu}{\sigma^2}\,e^{-(x_i-\mu)^2/(2\sigma^2)}, \qquad \pypx{E_i}{\sigma} = \frac{(x_i-\mu)^2}{\sigma^3}\,e^{-(x_i-\mu)^2/(2\sigma^2)}\)
(don’t forget that \(\{x_i\}\) and \(\{t_i\}\) are fixed!)
Can you see the problem in this approach? As the \(\{t_i\}\) are fixed, the problem reduces to optimizing \(f(x_i;\mu,\sigma)\) on its own, regardless of the \(\{t_i\}\) values. If we follow this approach, we will most likely end up with a \((\mu,\sigma)\) that pushes all the projected values very close to 0.
You are invited to try this approach, i.e.,
def F_mu(x,mu,sigma):
    return (x-mu)/sigma**2*np.exp(-(x-mu)**2/(2*sigma**2))
def F_sigma(x,mu,sigma):
    return (x-mu)**2/sigma**3*np.exp(-(x-mu)**2/(2*sigma**2))
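One quick way to see the problem concretely is to compare this naive objective at the true parameters with its value when the curve is pushed far away from the data; in the sketch below, the far-off pair \((\mu,\sigma)=(20,1)\) is an arbitrary choice:

# Naive objective: sum of the (unsquared) differences t_i - y_i.
naive_error = lambda mu_,sigma_: np.sum(t - f(x,mu_,sigma_))
print(naive_error(5,1))   # perfect fit: the differences sum to 0
print(naive_error(20,1))  # curve pushed away: y_i ~ 0, so the sum is sum(t) < 0
# The second value is smaller (more negative), i.e. this objective rewards
# ignoring the data -- hence the squared error introduced below.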
But what we really have in mind is the fact that, for a given \(x_i\), we want to find values as close to the corresponding \(t_i\) as possible. One way to obtain this would be to define the error function as:

\(E_i(\mu,\sigma) = \left(t_i - y_i\right)^2 = \left(t_i + e^{-(x_i-\mu)^2/(2\sigma^2)}\right)^2\)
and then we would have the following derivatives:

\(\pypx{E_i}{\mu} = 2\,\frac{x_i-\mu}{\sigma^2}\,e^{-(x_i-\mu)^2/(2\sigma^2)}\left(t_i + e^{-(x_i-\mu)^2/(2\sigma^2)}\right), \qquad \pypx{E_i}{\sigma} = 2\,\frac{(x_i-\mu)^2}{\sigma^3}\,e^{-(x_i-\mu)^2/(2\sigma^2)}\left(t_i + e^{-(x_i-\mu)^2/(2\sigma^2)}\right)\)
(Evaluated via WolframAlpha: 1, 2)
def F_mu(x,t,mu,sigma):
    return 2*(x-mu)/sigma**2*np.exp(-(x-mu)**2/(2*sigma**2))*\
           (t+np.exp(-(x-mu)**2/(2*sigma**2)))
def F_sigma(x,t,mu,sigma):
    return 2*(x-mu)**2/sigma**3*np.exp(-(x-mu)**2/(2*sigma**2))*\
           (t+np.exp(-(x-mu)**2/(2*sigma**2)))
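A minimal numerical sanity check of these gradients (the test point \((\mu,\sigma)=(4.0,\,1.5)\) and the step h below are arbitrary choices): a central finite difference of \(E_i\) should agree with F_mu and F_sigma to several digits.

# Compare the analytic gradients with central finite differences at one data point.
h = 1e-6
mu0, sigma0 = 4.0, 1.5
xi, ti = x[0], t[0]
E = lambda m,s: (ti + np.exp(-(xi-m)**2/(2*s**2)))**2
print(F_mu(xi,ti,mu0,sigma0),    (E(mu0+h,sigma0)-E(mu0-h,sigma0))/(2*h))
print(F_sigma(xi,ti,mu0,sigma0), (E(mu0,sigma0+h)-E(mu0,sigma0-h))/(2*h))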
np.array([x,t]).T
array([[ 5.68303007, -0.79194365],
[ 5.29078268, -0.95860394],
[ 4.17595952, -0.71211109],
[ 6.24959654, -0.45806428],
[ 4.41660884, -0.84351919],
[ 6.96423794, -0.14527666],
[ 6.53987834, -0.30555892],
[ 4.86294066, -0.99065134],
[ 3.3056984 , -0.23803705],
[ 6.23655758, -0.46554928]])
eta = 1
# Starting values
mu_opt = 2.7
sigma_opt = 2.3
tolerance = 1E-4
for i in range(10000):
    for ii in range(x.size):
        xi = x[ii]
        ti = t[ii]
        #print(xi,ti)
        F_mu_xi = F_mu(xi,ti,mu_opt,sigma_opt)
        F_sigma_xi = F_sigma(xi,ti,mu_opt,sigma_opt)
        mu_opt -= eta*F_mu_xi
        sigma_opt -= eta*F_sigma_xi
    total_absolute_error = np.sum(np.abs(t-f(x,mu_opt,sigma_opt)))
    if(total_absolute_error < tolerance):
        print(("As the sum of the absolute errors is sufficiently close to zero ({:.7f}),\n"+
               "\tbreaking the iteration at the {:d}. step!").
              format(total_absolute_error,i+1))
        break
print("mu: {:.4f}\tsigma: {:.4f}".format(mu_opt,sigma_opt))
plt.plot(xx,f(xx,mu,sigma),color="orange")
plt.plot(xx,f(xx,mu_opt,sigma_opt),":b")
plt.plot(x,t,"o")
plt.show()
As the sum of the absolute errors is sufficiently close to zero (0.0000034),
breaking the iteration at the 44. step!
mu: 5.0000 sigma: 1.0000

Stochastic Gradient Descent Algorithm#
In this approach, instead of updating the parameters separately for every single data point, we update them once per iteration using the gradient summed over all the data points:
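In other words, each iteration applies

\(\mu \leftarrow \mu - \eta\sum_i \pypx{E_i}{\mu}, \qquad \sigma \leftarrow \sigma - \eta\sum_i \pypx{E_i}{\sigma}\)

which is what the np.sum calls below compute.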
eta = 0.1
# Starting values
mu_opt = 2.7
sigma_opt = 2.3
tolerance = 1E-4
total_absolute_error0 = 1000
for i in range(10000):
    d_mu = -eta*np.sum(F_mu(x,t,mu_opt,sigma_opt))
    d_sigma = -eta*np.sum(F_sigma(x,t,mu_opt,sigma_opt))
    mu_opt += d_mu
    sigma_opt += d_sigma
    total_absolute_error = np.sum(np.abs(t-f(x,mu_opt,sigma_opt)))
    if(total_absolute_error < tolerance):
        print(("As the sum of the absolute errors is sufficiently close to zero ({:.7f}),\n"+
               "\tbreaking the iteration at the {:d}. step!").
              format(total_absolute_error,i+1))
        break
print("mu: {:.4f}\tsigma: {:.4f}".format(mu_opt,sigma_opt))
plt.plot(xx,f(xx,mu,sigma),color="orange")
plt.plot(xx,f(xx,mu_opt,sigma_opt),":b")
plt.plot(x,t,"o")
plt.show()
As the sum of the absolute errors is sufficiently close to zero (0.0000838),
breaking the iteration at the 473. step!
mu: 5.0000 sigma: 1.0000

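For comparison, the same fit can also be handed to SciPy's general-purpose minimizer by wrapping the total squared error as a function of \((\mu,\sigma)\):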
def F(musigma,x,t):
    return np.sum((t + np.exp(-(x-musigma[0])**2/(2*musigma[1]**2)))**2)
opt = optimize.minimize(F,x0=(2.7,2.3),args=(x,t))
opt.x,opt.fun
(array([-0.94939593, 6.24977685]), 0.7517808253037702)
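Started from \((2.7,\,2.3)\), the unconstrained run converges to a poor solution (\(\mu\approx-0.95\), \(\sigma\approx6.25\)) with a clearly non-zero residual; constraining \(\mu\) to a sensible range (here \(3\le\mu\le6.5\)) recovers the true parameters: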
opt = optimize.minimize(F,x0=(2.7,2.3),args=(x,t),bounds=[(3,6.5),(None,None)])
opt.x,opt.fun
(array([5.00000008, 0.99999998]), 1.0592809689731542e-14)