Professional Documents
Culture Documents
UNCUYO
UNIVERSIDAD
NACIONAL DE CUYO
Clasificación de imágenes
❖ Nearest Neighbors
❖ K-Nearest Neighbors
❖ Linear Classifier :
Nos quedaba pendiente
❖ Support Vector Machine
❖ Softmax Classifier
Clasificación lineal
bias: $x_0 = 1$
$f(x, W) = W x = \hat{W} x + b$
<latexit sha1_base64="M3TAK+CWUEoVaxSGqd5n/jwXh4A=">AAACAXicbVDLSgMxFL3js9bXqBvBTbAIFaXMVEE3QtGNywq2U2iHkkkzbWjmQZKRlqFu/BU3LhRx61+4829M21lo64F7OZxzL8k9XsyZVJb1bSwsLi2vrObW8usbm1vb5s5uXUaJILRGIh6Jhocl5SykNcUUp41YUBx4nDpe/2bsOw9USBaF92oYUzfA3ZD5jGClpba57xcHp84xukLOQLdWD6vUGQ1OvLZZsErWBGie2BkpQIZq2/xqdSKSBDRUhGMpm7YVKzfFQjHC6SjfSiSNMenjLm1qGuKASjedXDBCR1rpID8SukKFJurvjRQHUg4DT08GWPXkrDcW//OaifIv3ZSFcaJoSKYP+QlHKkLjOFCHCUoUH2qCiWD6r4j0sMBE6dDyOgR79uR5Ui+X7LNS+e68ULnO4sjBARxCEWy4gArcQhVqQOARnuEV3own48V4Nz6mowtGtrMHf2B8/gCE3JUH</latexit>
<latexit sha1_base64="YN9Q4TjjIqbPTr+J0ZjVFyAk2oE=">AAAB7HicbVBNS8NAEJ34WetX1aOXxSJ4KkkV9CIUvXisYNpCG8pmO2mXbjZhdyOW0t/gxYMiXv1B3vw3btsctPXBwOO9GWbmhang2rjut7Oyura+sVnYKm7v7O7tlw4OGzrJFEOfJSJRrZBqFFyib7gR2EoV0jgU2AyHt1O/+YhK80Q+mFGKQUz7kkecUWMl/6nrXnvdUtmtuDOQZeLlpAw56t3SV6eXsCxGaZigWrc9NzXBmCrDmcBJsZNpTCkb0j62LZU0Rh2MZ8dOyKlVeiRKlC1pyEz9PTGmsdajOLSdMTUDvehNxf+8dmaiq2DMZZoZlGy+KMoEMQmZfk56XCEzYmQJZYrbWwkbUEWZsfkUbQje4svLpFGteOeV6v1FuXaTx1GAYziBM/DgEmpwB3XwgQGHZ3iFN0c6L8678zFvXXHymSP4A+fzB/5PjiU=</latexit>
123 =
<latexit sha1_base64="MWbL6R2hZsQThSAdMNvF0orSXwY=">AAAB6HicbVDLSgNBEOyNrxhfUY9eBoPgKexGQS9C0IvHBMwDkiXMTnqTMbOzy8ysEEK+wIsHRbz6Sd78GyfJHjSxoKGo6qa7K0gE18Z1v53c2vrG5lZ+u7Czu7d/UDw8auo4VQwbLBaxagdUo+ASG4Ybge1EIY0Cga1gdDfzW0+oNI/lgxkn6Ed0IHnIGTVWqt/0iiW37M5BVomXkRJkqPWKX91+zNIIpWGCat3x3MT4E6oMZwKnhW6qMaFsRAfYsVTSCLU/mR86JWdW6ZMwVrakIXP198SERlqPo8B2RtQM9bI3E//zOqkJr/0Jl0lqULLFojAVxMRk9jXpc4XMiLEllClubyVsSBVlxmZTsCF4yy+vkmal7F2UK/XLUvU2iyMPJ3AK5+DBFVThHmrQAAYIz/AKb86j8+K8Ox+L1pyTzRzDHzifP44bjMU=</latexit>
0.3 dog
2 -0.7 30 … 30 … 2 frog
W
<latexit sha1_base64="yxUgNFppSsebkUqo0HdMiZJUGss=">AAAB6HicbVBNS8NAEJ34WetX1aOXxSJ4KkkV9Fj04rEF+wFtKJvtpF272YTdjVBCf4EXD4p49Sd589+4bXPQ1gcDj/dmmJkXJIJr47rfztr6xubWdmGnuLu3f3BYOjpu6ThVDJssFrHqBFSj4BKbhhuBnUQhjQKB7WB8N/PbT6g0j+WDmSToR3QoecgZNVZqtPulsltx5yCrxMtJGXLU+6Wv3iBmaYTSMEG17npuYvyMKsOZwGmxl2pMKBvTIXYtlTRC7WfzQ6fk3CoDEsbKljRkrv6eyGik9SQKbGdEzUgvezPxP6+bmvDGz7hMUoOSLRaFqSAmJrOvyYArZEZMLKFMcXsrYSOqKDM2m6INwVt+eZW0qhXvslJtXJVrt3kcBTiFM7gAD66hBvdQhyYwQHiGV3hzHp0X5935WLSuOfnMCfyB8/kDtYOM3w==</latexit>
x
<latexit sha1_base64="hL+FaLtOT9luwfLW3Ut08xl3Pcw=">AAAB6HicbVDLTgJBEOzFF+IL9ehlIjHxRHbRRI9ELx4hkUcCGzI79MLI7OxmZtZICF/gxYPGePWTvPk3DrAHBSvppFLVne6uIBFcG9f9dnJr6xubW/ntws7u3v5B8fCoqeNUMWywWMSqHVCNgktsGG4EthOFNAoEtoLR7cxvPaLSPJb3ZpygH9GB5CFn1Fip/tQrltyyOwdZJV5GSpCh1it+dfsxSyOUhgmqdcdzE+NPqDKcCZwWuqnGhLIRHWDHUkkj1P5kfuiUnFmlT8JY2ZKGzNXfExMaaT2OAtsZUTPUy95M/M/rpCa89idcJqlByRaLwlQQE5PZ16TPFTIjxpZQpri9lbAhVZQZm03BhuAtv7xKmpWyd1Gu1C9L1ZssjjycwCmcgwdXUIU7qEEDGCA8wyu8OQ/Oi/PufCxac042cwx/4Hz+AOeHjQA=</latexit>
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i)$
<latexit sha1_base64="yzOireLQ5ztcqr1+6p23MjT8bl4=">AAACGnicbVDLSgNBEJyNrxhfUY9eBoOQQAi7UdCLEPTiQSSCSYRsWGYns8mQ2QczvZKw7Hd48Ve8eFDEm3jxb5w8DppY0FBUddPd5UaCKzDNbyOztLyyupZdz21sbm3v5Hf3miqMJWUNGopQ3rtEMcED1gAOgt1HkhHfFazlDi7HfuuBScXD4A5GEev4pBdwj1MCWnLylg1sCIkIlUrxObY9SWhipclNaqvYdzi+LnrFocPLuFUq45HDS06+YFbMCfAisWakgGaoO/lPuxvS2GcBUEGUaltmBJ2ESOBUsDRnx4pFhA5Ij7U1DYjPVCeZvJbiI610sRdKXQHgifp7IiG+UiPf1Z0+gb6a98bif147Bu+sk/AgioEFdLrIiwWGEI9zwl0uGQUx0oRQyfWtmPaJTgd0mjkdgjX/8iJpVivWcaV6e1KoXcziyKIDdIiKyEKnqIauUB01EEWP6Bm9ojfjyXgx3o2PaWvGmM3soz8wvn4AS++ftA==</latexit>
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
donde $S = f(x, W)$
$S_{y_i}$
<latexit sha1_base64="wE/imfAg2AVK8mKbeJLLCFls5Ic=">AAAB7nicbVBNS8NAEJ3Ur1q/qh69LBbBU0lqQY8FLx4r2g9oQ9hsN+3S3U3Y3Qgh9Ed48aCIV3+PN/+N2zYHbX0w8Hhvhpl5YcKZNq777ZQ2Nre2d8q7lb39g8Oj6vFJV8epIrRDYh6rfog15UzSjmGG036iKBYhp71wejv3e09UaRbLR5Ml1Bd4LFnECDZW6j0EeRawWVCtuXV3AbROvILUoEA7qH4NRzFJBZWGcKz1wHMT4+dYGUY4nVWGqaYJJlM8pgNLJRZU+/ni3Bm6sMoIRbGyJQ1aqL8nciy0zkRoOwU2E73qzcX/vEFqohs/ZzJJDZVkuShKOTIxmv+ORkxRYnhmCSaK2VsRmWCFibEJVWwI3urL66TbqHtX9cZ9s9ZqFnGU4QzO4RI8uIYW3EEbOkBgCs/wCm9O4rw4787HsrXkFDOn8AfO5w9/qY+h</latexit>
<latexit sha1_base64="+NU1KmWmPppVa6Y7UEMyRu+aDpU=">AAAB8XicbVBNS8NAEJ3Ur1q/oh69LBahgpSkCnoRil48VrQf2Iay2W7apZtN2N2IJfRfePGgiFf/jTf/jds2B219MPB4b4aZeX7MmdKO823llpZXVtfy64WNza3tHXt3r6GiRBJaJxGPZMvHinImaF0zzWkrlhSHPqdNf3g98ZuPVCoWiXs9iqkX4r5gASNYG+nhDl2ioPR00jzu2kWn7EyBFombkSJkqHXtr04vIklIhSYcK9V2nVh7KZaaEU7HhU6iaIzJEPdp21CBQ6q8dHrxGB0ZpYeCSJoSGk3V3xMpDpUahb7pDLEeqHlvIv7ntRMdXHgpE3GiqSCzRUHCkY7Q5H3UY5ISzUeGYCKZuRWRAZaYaBNSwYTgzr+8SBqVsntartyeFatXWRx5OIBDKIEL51CFG6hBHQgIeIZXeLOU9WK9Wx+z1pyVzezDH1ifP1ZRj2Q=</latexit>
<latexit sha1_base64="bdAS1DU9pLDwmRSuoG8etVlJoIw=">AAAB7XicbVBNS8NAEN34WetX1aOXxSJ4KkkV9FjUg8cK9gPaUDbbSbt2kw27E6GE/gcvHhTx6v/x5r9x2+agrQ8GHu/NMDMvSKQw6Lrfzsrq2vrGZmGruL2zu7dfOjhsGpVqDg2upNLtgBmQIoYGCpTQTjSwKJDQCkY3U7/1BNoIFT/gOAE/YoNYhIIztFKzewsSWa9UdivuDHSZeDkpkxz1Xumr21c8jSBGLpkxHc9N0M+YRsElTIrd1EDC+IgNoGNpzCIwfja7dkJPrdKnodK2YqQz9fdExiJjxlFgOyOGQ7PoTcX/vE6K4ZWfiThJEWI+XxSmkqKi09dpX2jgKMeWMK6FvZXyIdOMow2oaEPwFl9eJs1qxTuvVO8vyrXrPI4COSYn5Ix45JLUyB2pkwbh5JE8k1fy5ijnxXl3PuatK04+c0T+wPn8AWHajwA=</latexit>
Support Vector Machine
❖ Supongamos tenemos sólo 3 clases y 3 ejemplos
<latexit sha1_base64="WML4l4JQNxe8ZE9XW9VSYUKjYgc=">AAAB8XicbVDLSgNBEOyNrxhfUY9eBoPgKexGQS9CUA8eI5gHJkuYnXSSIbOzy8ysEJb8hRcPinj1b7z5N06SPWhiQUNR1U13VxALro3rfju5ldW19Y38ZmFre2d3r7h/0NBRohjWWSQi1QqoRsEl1g03AluxQhoGApvB6GbqN59QaR7JBzOO0Q/pQPI+Z9RY6bFzi8JQckW8brHklt0ZyDLxMlKCDLVu8avTi1gSojRMUK3bnhsbP6XKcCZwUugkGmPKRnSAbUslDVH76eziCTmxSo/0I2VLGjJTf0+kNNR6HAa2M6RmqBe9qfif105M/9JPuYwTg5LNF/UTQUxEpu+THlfIjBhbQpni9lbChlRRZmxIBRuCt/jyMmlUyt5ZuXJ/XqpeZ3Hk4QiO4RQ8uIAq3EEN6sBAwjO8wpujnRfn3fmYt+acbOYQ/sD5/AEHho/W</latexit>
$\Delta = 1$
Img. source: Stanford CS231n 2017
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
¿Usamos 1 o 100?
¿De qué depende?
Img. source: Stanford CS231n 2017
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i)$
<latexit sha1_base64="yzOireLQ5ztcqr1+6p23MjT8bl4=">AAACGnicbVDLSgNBEJyNrxhfUY9eBoOQQAi7UdCLEPTiQSSCSYRsWGYns8mQ2QczvZKw7Hd48Ve8eFDEm3jxb5w8DppY0FBUddPd5UaCKzDNbyOztLyyupZdz21sbm3v5Hf3miqMJWUNGopQ3rtEMcED1gAOgt1HkhHfFazlDi7HfuuBScXD4A5GEev4pBdwj1MCWnLylg1sCIkIlUrxObY9SWhipclNaqvYdzi+LnrFocPLuFUq45HDS06+YFbMCfAisWakgGaoO/lPuxvS2GcBUEGUaltmBJ2ESOBUsDRnx4pFhA5Ij7U1DYjPVCeZvJbiI610sRdKXQHgifp7IiG+UiPf1Z0+gb6a98bif147Bu+sk/AgioEFdLrIiwWGEI9zwl0uGQUx0oRQyfWtmPaJTgd0mjkdgjX/8iJpVivWcaV6e1KoXcziyKIDdIiKyEKnqIauUB01EEWP6Bm9ojfjyXgx3o2PaWvGmM3soz8wvn4AS++ftA==</latexit>
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i)$
Img. source: Stanford CS231n 2017
<latexit sha1_base64="yzOireLQ5ztcqr1+6p23MjT8bl4=">AAACGnicbVDLSgNBEJyNrxhfUY9eBoOQQAi7UdCLEPTiQSSCSYRsWGYns8mQ2QczvZKw7Hd48Ve8eFDEm3jxb5w8DppY0FBUddPd5UaCKzDNbyOztLyyupZdz21sbm3v5Hf3miqMJWUNGopQ3rtEMcED1gAOgt1HkhHfFazlDi7HfuuBScXD4A5GEev4pBdwj1MCWnLylg1sCIkIlUrxObY9SWhipclNaqvYdzi+LnrFocPLuFUq45HDS06+YFbMCfAisWakgGaoO/lPuxvS2GcBUEGUaltmBJ2ESOBUsDRnx4pFhA5Ij7U1DYjPVCeZvJbiI610sRdKXQHgifp7IiG+UiPf1Z0+gb6a98bif147Bu+sk/AgioEFdLrIiwWGEI9zwl0uGQUx0oRQyfWtmPaJTgd0mjkdgjX/8iJpVivWcaV6e1KoXcziyKIDdIiKyEKnqIauUB01EEWP6Bm9ojfjyXgx3o2PaWvGmM3soz8wvn4AS++ftA==</latexit>
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i)$
Img. source: Stanford CS231n 2017
<latexit sha1_base64="yzOireLQ5ztcqr1+6p23MjT8bl4=">AAACGnicbVDLSgNBEJyNrxhfUY9eBoOQQAi7UdCLEPTiQSSCSYRsWGYns8mQ2QczvZKw7Hd48Ve8eFDEm3jxb5w8DppY0FBUddPd5UaCKzDNbyOztLyyupZdz21sbm3v5Hf3miqMJWUNGopQ3rtEMcED1gAOgt1HkhHfFazlDi7HfuuBScXD4A5GEev4pBdwj1MCWnLylg1sCIkIlUrxObY9SWhipclNaqvYdzi+LnrFocPLuFUq45HDS06+YFbMCfAisWakgGaoO/lPuxvS2GcBUEGUaltmBJ2ESOBUsDRnx4pFhA5Ij7U1DYjPVCeZvJbiI610sRdKXQHgifp7IiG+UiPf1Z0+gb6a98bif147Bu+sk/AgioEFdLrIiwWGEI9zwl0uGQUx0oRQyfWtmPaJTgd0mjkdgjX/8iJpVivWcaV6e1KoXcziyKIDdIiKyEKnqIauUB01EEWP6Bm9ojfjyXgx3o2PaWvGmM3soz8wvn4AS++ftA==</latexit>
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i)$
Img. source: Stanford CS231n 2017
<latexit sha1_base64="yzOireLQ5ztcqr1+6p23MjT8bl4=">AAACGnicbVDLSgNBEJyNrxhfUY9eBoOQQAi7UdCLEPTiQSSCSYRsWGYns8mQ2QczvZKw7Hd48Ve8eFDEm3jxb5w8DppY0FBUddPd5UaCKzDNbyOztLyyupZdz21sbm3v5Hf3miqMJWUNGopQ3rtEMcED1gAOgt1HkhHfFazlDi7HfuuBScXD4A5GEev4pBdwj1MCWnLylg1sCIkIlUrxObY9SWhipclNaqvYdzi+LnrFocPLuFUq45HDS06+YFbMCfAisWakgGaoO/lPuxvS2GcBUEGUaltmBJ2ESOBUsDRnx4pFhA5Ij7U1DYjPVCeZvJbiI610sRdKXQHgifp7IiG+UiPf1Z0+gb6a98bif147Bu+sk/AgioEFdLrIiwWGEI9zwl0uGQUx0oRQyfWtmPaJTgd0mjkdgjX/8iJpVivWcaV6e1KoXcziyKIDdIiKyEKnqIauUB01EEWP6Bm9ojfjyXgx3o2PaWvGmM3soz8wvn4AS++ftA==</latexit>
Si $\Delta = 1$ y $W$ es pequeño, entonces $s \approx 0$.
Siendo esto así, ¿qué valor tiene la loss?
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i)$
Img. source: Stanford CS231n 2017
<latexit sha1_base64="yzOireLQ5ztcqr1+6p23MjT8bl4=">AAACGnicbVDLSgNBEJyNrxhfUY9eBoOQQAi7UdCLEPTiQSSCSYRsWGYns8mQ2QczvZKw7Hd48Ve8eFDEm3jxb5w8DppY0FBUddPd5UaCKzDNbyOztLyyupZdz21sbm3v5Hf3miqMJWUNGopQ3rtEMcED1gAOgt1HkhHfFazlDi7HfuuBScXD4A5GEev4pBdwj1MCWnLylg1sCIkIlUrxObY9SWhipclNaqvYdzi+LnrFocPLuFUq45HDS06+YFbMCfAisWakgGaoO/lPuxvS2GcBUEGUaltmBJ2ESOBUsDRnx4pFhA5Ij7U1DYjPVCeZvJbiI610sRdKXQHgifp7IiG+UiPf1Z0+gb6a98bif147Bu+sk/AgioEFdLrIiwWGEI9zwl0uGQUx0oRQyfWtmPaJTgd0mjkdgjX/8iJpVivWcaV6e1KoXcziyKIDdIiKyEKnqIauUB01EEWP6Bm9ojfjyXgx3o2PaWvGmM3soz8wvn4AS++ftA==</latexit>
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i)$
Img. source: Stanford CS231n 2017
<latexit sha1_base64="yzOireLQ5ztcqr1+6p23MjT8bl4=">AAACGnicbVDLSgNBEJyNrxhfUY9eBoOQQAi7UdCLEPTiQSSCSYRsWGYns8mQ2QczvZKw7Hd48Ve8eFDEm3jxb5w8DppY0FBUddPd5UaCKzDNbyOztLyyupZdz21sbm3v5Hf3miqMJWUNGopQ3rtEMcED1gAOgt1HkhHfFazlDi7HfuuBScXD4A5GEev4pBdwj1MCWnLylg1sCIkIlUrxObY9SWhipclNaqvYdzi+LnrFocPLuFUq45HDS06+YFbMCfAisWakgGaoO/lPuxvS2GcBUEGUaltmBJ2ESOBUsDRnx4pFhA5Ij7U1DYjPVCeZvJbiI610sRdKXQHgifp7IiG+UiPf1Z0+gb6a98bif147Bu+sk/AgioEFdLrIiwWGEI9zwl0uGQUx0oRQyfWtmPaJTgd0mjkdgjX/8iJpVivWcaV6e1KoXcziyKIDdIiKyEKnqIauUB01EEWP6Bm9ojfjyXgx3o2PaWvGmM3soz8wvn4AS++ftA==</latexit>
$L = \sum_{j \neq y_i} \max(0, S_j - S_{y_i} + \Delta)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i)$
Img. source: Stanford CS231n 2017
<latexit sha1_base64="yzOireLQ5ztcqr1+6p23MjT8bl4=">AAACGnicbVDLSgNBEJyNrxhfUY9eBoOQQAi7UdCLEPTiQSSCSYRsWGYns8mQ2QczvZKw7Hd48Ve8eFDEm3jxb5w8DppY0FBUddPd5UaCKzDNbyOztLyyupZdz21sbm3v5Hf3miqMJWUNGopQ3rtEMcED1gAOgt1HkhHfFazlDi7HfuuBScXD4A5GEev4pBdwj1MCWnLylg1sCIkIlUrxObY9SWhipclNaqvYdzi+LnrFocPLuFUq45HDS06+YFbMCfAisWakgGaoO/lPuxvS2GcBUEGUaltmBJ2ESOBUsDRnx4pFhA5Ij7U1DYjPVCeZvJbiI610sRdKXQHgifp7IiG+UiPf1Z0+gb6a98bif147Bu+sk/AgioEFdLrIiwWGEI9zwl0uGQUx0oRQyfWtmPaJTgd0mjkdgjX/8iJpVivWcaV6e1KoXcziyKIDdIiKyEKnqIauUB01EEWP6Bm9ojfjyXgx3o2PaWvGmM3soz8wvn4AS++ftA==</latexit>
❖ Elastic net (L1 + L2): $R(W) = \sum_{k,l} \beta W_{k,l}^2 + |W_{k,l}|$
❖ Max norm regularization
❖ Dropout
❖ Batch normalization también aplica un efecto de regularización
Clasificación de imágenes
❖ Nearest Neighbors
❖ K-Nearest Neighbors
❖ Linear Classifier :
❖ Support Vector Machine
❖ Softmax Classifier Nos quedaba pendiente
Softmax Classifier
❖ Al igual que SVM, en Softmax la función de activación
es lineal
$f(x, W) = W x$
<latexit sha1_base64="UC8OUwJ6qqWh68UG7aJIY5Xd+fQ=">AAAB8nicbVBNS8NAEN34WetX1aOXxSJUkJJUQS9C0YvHCrYppKFstpt26SYbdifSEvozvHhQxKu/xpv/xm2bg7Y+GHi8N8PMvCARXINtf1srq2vrG5uFreL2zu7efungsKVlqihrUimkagdEM8Fj1gQOgrUTxUgUCOYGw7up7z4xpbmMH2GcMD8i/ZiHnBIwkhdWRufuGb7B7qhbKttVewa8TJyclFGORrf01elJmkYsBiqI1p5jJ+BnRAGngk2KnVSzhNAh6TPP0JhETPvZ7OQJPjVKD4dSmYoBz9TfExmJtB5HgemMCAz0ojcV//O8FMJrP+NxkgKL6XxRmAoMEk//xz2uGAUxNoRQxc2tmA6IIhRMSkUTgrP48jJp1arORbX2cFmu3+ZxFNAxOkEV5KArVEf3qIGaiCKJntErerPAerHerY9564qVzxyhP7A+fwA7OI/q</latexit>
softmax
$f_i(z) = \frac{e^{z_i}}{\sum_j e^{z_j}}$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i) + \lambda R(W)$
<latexit sha1_base64="1888QJ1iSX/hhV6ImuBb1q1z9cU=">AAACKXicbVDLSgNBEJz1GeMr6tHLYBASDGE3CnoRgl48iEQxJpANy+xkNhky+2CmVxKW/R0v/ooXBUW9+iNOHgc1FjQUVd10d7mR4ApM88OYm19YXFrOrGRX19Y3NnNb23cqjCVldRqKUDZdopjgAasDB8GakWTEdwVruP3zkd+4Z1LxMLiFYcTaPukG3OOUgJacXNUGNoBEhEql+BTbniQ0sdLkKrVV7DscXxa8wsDhJdwolvDQ4UV8gG2hF3QIvik0ik4ub5bNMfAssaYkj6aoObkXuxPS2GcBUEGUallmBO2ESOBUsDRrx4pFhPZJl7U0DYjPVDsZf5rifa10sBdKXQHgsfpzIiG+UkPf1Z0+gZ76643E/7xWDN5JO+FBFAML6GSRFwsMIR7FhjtcMgpiqAmhkutbMe0RHRbocLM6BOvvy7PkrlK2DsuV66N89WwaRwbtoj1UQBY6RlV0gWqojih6QE/oFb0Zj8az8W58TlrnjOnMDvoF4+sbEDWkjA==</latexit>
Softmax Classifier
$L = -\log\left(\frac{e^{f_{y_i}}}{\sum_j e^{f_j}}\right) = -f_{y_i} + \log\left(\sum_j e^{f_j}\right)$
<latexit sha1_base64="fl4ZaEP98bchUI5EiBkFILd6Oag=">AAACVHicbVFNSxtBGJ5dtWra2lhP4uXFIFhKw6496EVI7cWDBwWjQjYus5N3kzGzH8y8K4Rlf5G/pYd6EPpLvAg6+TgY7QsDD8/HfDwT5Uoa8rx/jruwuPRheWW19vHT57Uv9fWvFyYrtMC2yFSmryJuUMkU2yRJ4VWukSeRwsto+HusX96iNjJLz2mUYzfh/VTGUnCyVFgfnsAh/AhU1odAYUy7EMSaixKvyzgsR6GsqqoMTJGENzDhbqoq0LI/oG/jIMxM8B3m9pgLwCwQ1hte05sMvAf+DDRav9Td85+7zdOwfh/0MlEkmJJQ3JiO7+XULbkmKRRWtaAwmHMx5H3sWJjyBE23nJRSwY5lehBn2q6UYMK+TpQ8MWaURNaZcBqYt9qY/J/WKSg+6JYyzQvCVEwPigsFlMG4YehJjYLUyAIutLR3BTHgtlSy/1CzJfhvn/weXOw1/Z/NvTO/0Tpi01lhW2yb7TKf7bMWO2anrM0E+8seHeY4zoPz5C64S1Or68wyG2xu3LUXJfa2WQ==</latexit>
$H(p, q) = -\sum_x p(x) \log q(x)$
$f(w)$
$w^{(0)}$
$\alpha \nabla_w f(w)$
$w^{(1)} = w^{(0)} - \alpha \nabla_w f(w)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i) + \lambda R(W)$
<latexit sha1_base64="1888QJ1iSX/hhV6ImuBb1q1z9cU=">AAACKXicbVDLSgNBEJz1GeMr6tHLYBASDGE3CnoRgl48iEQxJpANy+xkNhky+2CmVxKW/R0v/ooXBUW9+iNOHgc1FjQUVd10d7mR4ApM88OYm19YXFrOrGRX19Y3NnNb23cqjCVldRqKUDZdopjgAasDB8GakWTEdwVruP3zkd+4Z1LxMLiFYcTaPukG3OOUgJacXNUGNoBEhEql+BTbniQ0sdLkKrVV7DscXxa8wsDhJdwolvDQ4UV8gG2hF3QIvik0ik4ub5bNMfAssaYkj6aoObkXuxPS2GcBUEGUallmBO2ESOBUsDRrx4pFhPZJl7U0DYjPVDsZf5rifa10sBdKXQHgsfpzIiG+UkPf1Z0+gZ76643E/7xWDN5JO+FBFAML6GSRFwsMIR7FhjtcMgpiqAmhkutbMe0RHRbocLM6BOvvy7PkrlK2DsuV66N89WwaRwbtoj1UQBY6RlV0gWqojih6QE/oFb0Zj8az8W58TlrnjOnMDvoF4+sbEDWkjA==</latexit>
❖ SVM: $L = \sum_{j \neq y_i} \max(0, f_j - f_{y_i} + \Delta)$
Optimización
0.2 1.0 2.0 1 190.2 cat w1T xi
·
<latexit sha1_base64="tAawmPWMO4MOOxJ+ZasNr5SHOic=">AAAB8HicbVBNSwMxEJ2tX7V+VT16CRbBU9mtguKp4MVjhX5Juy7ZNG1Dk+ySZNWy9Fd48aCIV3+ON/+NabsHbX0w8Hhvhpl5YcyZNq777eRWVtfWN/Kbha3tnd294v5BU0eJIrRBIh6pdog15UzShmGG03asKBYhp61wdD31Ww9UaRbJuhnH1Bd4IFmfEWysdPcYePd19BSwoFhyy+4MaJl4GSlBhlpQ/Or2IpIIKg3hWOuO58bGT7EyjHA6KXQTTWNMRnhAO5ZKLKj209nBE3RilR7qR8qWNGim/p5IsdB6LELbKbAZ6kVvKv7ndRLTv/RTJuPEUEnmi/oJRyZC0+9RjylKDB9bgoli9lZEhlhhYmxGBRuCt/jyMmlWyt5ZuXJ7XqpeZXHk4QiO4RQ8uIAq3EANGkBAwDO8wpujnBfn3fmYt+acbOYQ/sD5/AEVIY/p</latexit>
90 =
<latexit sha1_base64="MWbL6R2hZsQThSAdMNvF0orSXwY=">AAAB6HicbVDLSgNBEOyNrxhfUY9eBoPgKexGQS9C0IvHBMwDkiXMTnqTMbOzy8ysEEK+wIsHRbz6Sd78GyfJHjSxoKGo6qa7K0gE18Z1v53c2vrG5lZ+u7Czu7d/UDw8auo4VQwbLBaxagdUo+ASG4Ybge1EIY0Cga1gdDfzW0+oNI/lgxkn6Ed0IHnIGTVWqt/0iiW37M5BVomXkRJkqPWKX91+zNIIpWGCat3x3MT4E6oMZwKnhW6qMaFsRAfYsVTSCLU/mR86JWdW6ZMwVrakIXP198SERlqPo8B2RtQM9bI3E//zOqkJr/0Jl0lqULLFojAVxMRk9jXpc4XMiLEllClubyVsSBVlxmZTsCF4yy+vkmal7F2UK/XLUvU2iyMPJ3AK5+DBFVThHmrQAAYIz/AKb86j8+K8Ox+L1pyTzRzDHzifP44bjMU=</latexit>
X
<latexit sha1_base64="yxUgNFppSsebkUqo0HdMiZJUGss=">AAAB6HicbVBNS8NAEJ34WetX1aOXxSJ4KkkV9Fj04rEF+wFtKJvtpF272YTdjVBCf4EXD4p49Sd589+4bXPQ1gcDj/dmmJkXJIJr47rfztr6xubWdmGnuLu3f3BYOjpu6ThVDJssFrHqBFSj4BKbhhuBnUQhjQKB7WB8N/PbT6g0j+WDmSToR3QoecgZNVZqtPulsltx5yCrxMtJGXLU+6Wv3iBmaYTSMEG17npuYvyMKsOZwGmxl2pMKBvTIXYtlTRC7WfzQ6fk3CoDEsbKljRkrv6eyGik9SQKbGdEzUgvezPxP6+bmvDGz7hMUoOSLRaFqSAmJrOvyYArZEZMLKFMcXsrYSOqKDM2m6INwVt+eZW0qhXvslJtXJVrt3kcBTiFM7gAD66hBvdQhyYwQHiGV3hzHp0X5935WLSuOfnMCfyB8/kDtYOM3w==</latexit>
$L = \sum_{j \neq y_i} \max(0, w_j^T x_i - w_{y_i}^T x_i + \Delta)$
$\text{loss} = \frac{1}{N} \sum_i L(f(x_i, W), y_i) + \lambda R(W)$
1
<latexit sha1_base64="1888QJ1iSX/hhV6ImuBb1q1z9cU=">AAACKXicbVDLSgNBEJz1GeMr6tHLYBASDGE3CnoRgl48iEQxJpANy+xkNhky+2CmVxKW/R0v/ooXBUW9+iNOHgc1FjQUVd10d7mR4ApM88OYm19YXFrOrGRX19Y3NnNb23cqjCVldRqKUDZdopjgAasDB8GakWTEdwVruP3zkd+4Z1LxMLiFYcTaPukG3OOUgJacXNUGNoBEhEql+BTbniQ0sdLkKrVV7DscXxa8wsDhJdwolvDQ4UV8gG2hF3QIvik0ik4ub5bNMfAssaYkj6aoObkXuxPS2GcBUEGUallmBO2ESOBUsDRrx4pFhPZJl7U0DYjPVDsZf5rifa10sBdKXQHgsfpzIiG+UkPf1Z0+gZ76643E/7xWDN5JO+FBFAML6GSRFwsMIR7FhjtcMgpiqAmhkutbMe0RHRbocLM6BOvvy7PkrlK2DsuV66N89WwaRwbtoj1UQBY6RlV0gWqojih6QE/oFb0Zj8az8W58TlrnjOnMDvoF4+sbEDWkjA==</latexit>
<latexit sha1_base64="AMN4RntgoyQPXIG4f0tq5dqZud4=">AAADCnicfZJPb9MwGMad8G+EP+vgyOUVFVMroEpSJBAS0iQ4cBxoXSfVIXIcp7PmOMF2oFWUMxe+ChcOIMSVT8CNb4PTBTTWsVey9NP7Ps4TP3ZSCq6N7/9y3AsXL12+snHVu3b9xs3N3tatfV1UirIJLUShDhKimeCSTQw3gh2UipE8EWyaHD1v59N3TGleyD2zLFmUk7nkGafE2Fa85YCHEzbnstbWzjQeNmxhalFo3cA2PAOcKULroKnDBmYDnJPFwH8A7+PgzR4s4gAeWg47vg/4BROGDFv6qxyfpxwCxh6cqG3AbyuSWsWaWbj6xLjjs83C85TD6P9uWNjQUgKvB9Ohh5lM/wQS9/r+yF8VrEPQQR91tRv3fuK0oFXOpKGCaD0L/NJENVGGU8FswpVmJaFHZM5mFiXJmY7q1VU2cM92UsgKZZc0sOqe3FGTXOtlnlhlTsyhPj1rm2fNZpXJnkQ1l2VlmKTHRlklwBTQvgtIuWLUiKUFQhW3/wr0kNi7N/b1tCEEp4+8DvvhKBiPwleP+jtPuzg20B10Fw1QgB6jHfQS7aIJos4H55PzxfnqfnQ/u9/c78dS1+n23Eb/lPvjN5Ig3+s=</latexit>
Corresponde a los pesos de la clase verdadera, y_1=2 + R(W )
❖ gradiente descendente: $W = W - \alpha \nabla_W \text{loss}$
Notar que se escala la imagen
90 =
<latexit sha1_base64="MWbL6R2hZsQThSAdMNvF0orSXwY=">AAAB6HicbVDLSgNBEOyNrxhfUY9eBoPgKexGQS9C0IvHBMwDkiXMTnqTMbOzy8ysEEK+wIsHRbz6Sd78GyfJHjSxoKGo6qa7K0gE18Z1v53c2vrG5lZ+u7Czu7d/UDw8auo4VQwbLBaxagdUo+ASG4Ybge1EIY0Cga1gdDfzW0+oNI/lgxkn6Ed0IHnIGTVWqt/0iiW37M5BVomXkRJkqPWKX91+zNIIpWGCat3x3MT4E6oMZwKnhW6qMaFsRAfYsVTSCLU/mR86JWdW6ZMwVrakIXP198SERlqPo8B2RtQM9bI3E//zOqkJr/0Jl0lqULLFojAVxMRk9jXpc4XMiLEllClubyVsSBVlxmZTsCF4yy+vkmal7F2UK/XLUvU2iyMPJ3AK5+DBFVThHmrQAAYIz/AKb86j8+K8Ox+L1pyTzRzDHzifP44bjMU=</latexit>
X
<latexit sha1_base64="yxUgNFppSsebkUqo0HdMiZJUGss=">AAAB6HicbVBNS8NAEJ34WetX1aOXxSJ4KkkV9Fj04rEF+wFtKJvtpF272YTdjVBCf4EXD4p49Sd589+4bXPQ1gcDj/dmmJkXJIJr47rfztr6xubWdmGnuLu3f3BYOjpu6ThVDJssFrHqBFSj4BKbhhuBnUQhjQKB7WB8N/PbT6g0j+WDmSToR3QoecgZNVZqtPulsltx5yCrxMtJGXLU+6Wv3iBmaYTSMEG17npuYvyMKsOZwGmxl2pMKBvTIXYtlTRC7WfzQ6fk3CoDEsbKljRkrv6eyGik9SQKbGdEzUgvezPxP6+bmvDGz7hMUoOSLRaFqSAmJrOvyYArZEZMLKFMcXsrYSOqKDM2m6INwVt+eZW0qhXvslJtXJVrt3kcBTiFM7gAD66hBvdQhyYwQHiGV3hzHp0X5935WLSuOfnMCfyB8/kDtYOM3w==</latexit>
$L = \sum_{j \neq y_i} \max(0, w_j^T x_i - w_{y_i}^T x_i + \Delta)$
0.2 1.0 0.0 … 0.0 1 0.2 cat
123 =
<latexit sha1_base64="MWbL6R2hZsQThSAdMNvF0orSXwY=">AAAB6HicbVDLSgNBEOyNrxhfUY9eBoPgKexGQS9C0IvHBMwDkiXMTnqTMbOzy8ysEEK+wIsHRbz6Sd78GyfJHjSxoKGo6qa7K0gE18Z1v53c2vrG5lZ+u7Czu7d/UDw8auo4VQwbLBaxagdUo+ASG4Ybge1EIY0Cga1gdDfzW0+oNI/lgxkn6Ed0IHnIGTVWqt/0iiW37M5BVomXkRJkqPWKX91+zNIIpWGCat3x3MT4E6oMZwKnhW6qMaFsRAfYsVTSCLU/mR86JWdW6ZMwVrakIXP198SERlqPo8B2RtQM9bI3E//zOqkJr/0Jl0lqULLFojAVxMRk9jXpc4XMiLEllClubyVsSBVlxmZTsCF4yy+vkmal7F2UK/XLUvU2iyMPJ3AK5+DBFVThHmrQAAYIz/AKb86j8+K8Ox+L1pyTzRzDHzifP44bjMU=</latexit>
0.3 dog
2 -0.7 30 … 30 … 2 frog
<latexit sha1_base64="eKuMw87scmkEmwqh07asQ0COg7k=">AAACFXicbZDLSsNAFIYnXmu9RV26GSxCBSlJFXQjFN24cFHBXqAJYTKdtNNOLsxM1BLyEm58FTcuFHEruPNtnLQBtfWHgY//nDMz53cjRoU0jC9tbn5hcWm5sFJcXVvf2NS3tpsijDkmDRyykLddJAijAWlIKhlpR5wg32Wk5Q4vsnrrlnBBw+BGjiJi+6gXUI9iJJXl6IeWxxFOrAhxSRGDV+kP3zkJHaQpPIPle4ceOANHLxkVYyw4C2YOJZCr7uifVjfEsU8CiRkSomMakbST7H7MSFq0YkEihIeoRzoKA+QTYSfjrVK4r5wu9EKuTiDh2P09kSBfiJHvqk4fyb6YrmXmf7VOLL1TO6FBFEsS4MlDXsygDGEWEexSTrBkIwUIc6r+CnEfqZikCrKoQjCnV56FZrViHlWq18el2nkeRwHsgj1QBiY4ATVwCeqgATB4AE/gBbxqj9qz9qa9T1rntHxmB/yR9vENWR+e5Q==</latexit>
@wij
$(\nabla_W L)_{y_i} = -\sum_{j \neq y_i} \mathbb{I}\left(w_j^T x_i - w_{y_i}^T x_i + \Delta > 0\right) x_i$
❖ mini-batch = 1
❖ Es común que se diga SGD cuando en realidad es BGD
# ------ Naive SGD implementation
tol = 1e-3
delta = np.inf
while delta > tol:
    data_batch = sample_data(training_data, batch_size)
    old = loss_fun(data_batch, weights)
    w_grads = evaluate_gradient(loss_fun, data_batch, weights)
    weights += - step_size * w_grads
    delta = np.abs(old - loss_fun(data_batch, weights))
Recordemos
❖ Relación entre distintas técnicas Salida
de AI
Mapeo de
Salida Salida
características