Local SGD for non-i.i.d. data
Konstantin Mishchenko
Work done together with Ahmed Khaled and Peter Richtárik
Local SGD for non-i.i.d. data Konstantin Mishchenko Work done - - PowerPoint PPT Presentation
Local SGD for non-i.i.d. data Konstantin Mishchenko Work done together with Ahmed Khaled and Peter Richtárik
Work done together with Ahmed Khaled and Peter Richtárik
x
M
m=1
x
M
m=1
x
M
m=1
x
M
m=1
$x^m_{t+1} = x^m_t - \gamma \nabla f_m(x^m_t; \xi^m_t)$, otherwise
<latexit sha1_base64="TU3D7h/GIHQvE30NZkRDc74gSRE=">ACenicbVHbatAEF2pt9S9ueljKQwxbROSGCkNJBACoX3JYwp1ErBcsVqN7CW7K7E7Sm2EP6K/lrd+SV/60LWtQpt0YOHMOXPbmaxS0lEU/QjCe/cfPHy09rjz5Omz5y+6L9fPXVlbgQNRqtJeZtyhkgYHJEnhZWR60zhRXb1aFfXKN1sjRfaFbhSPOxkYUnDyVdr9P04a24/lXDceQZDiWphG+npt3kgknaOWdhHBKjSxgDgQrB3SZe/f0OEoS6ExT8jV2IRlzrTkhmeKQ5HqzaVyBMlULsDWzp/0kiZov0mH4Huhydu+abcX9aOlwV0Qt6DHWjtLuzdJXopaoyGhuHPDOKpo1HBLUij0tWuHFRdXfIxDw3X6EbNcnVzeOuZHIrS+mcIluzfGQ3Xzs105iM1p4m7rS3I/2nDmorDUSNVRMasWpU1AqohMUdIJcWBamZB1xY6WcFMeGWC/LX6vglxLe/fBec7/XjD/29z/u9k4/tOtbYa7bBNlnMDtgJO2VnbMAE+xm8Cd4F74Nf4Ua4FW6vQsOgzXnF/rFw/zcCfb63</latexit>x
M
m=1
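$$x^m_{t+1} = \begin{cases} \dfrac{1}{M} \sum_{j=1}^{M} \bigl(x^j_t - \gamma \nabla f_j(x^j_t; \xi^j_t)\bigr), & \text{if } t \bmod H = 0, \\ x^m_t - \gamma \nabla f_m(x^m_t; \xi^m_t), & \text{otherwise.} \end{cases}$$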
<latexit sha1_base64="lgA18Epjy9RAdJcl5dGIGQd9cg=">ACsXicbVFda9swFJW9ry7SrfHvVwWBg3rgt0OVhiBsr30pdB03bEjicrcqLEko10vSUI/789723/ZnLiwtb2guDo3HuOru5Ny1wYDI/n/v/oOHj3Yed548fb8RXf35YUpKs34iBV5oa9SanguFB+hwJxflZpTmeb8Ml1+afKXP7g2olDnuC5LOlMiUwio5Kur9WicV3YT2RMIQo5TOhLHN+pu5EmabMhrU9rSNTycQuhq7uFPZWCU4W8B6iGZWSQqRomlPIksU28wmilWhAv78fIV+hFRnUgLC9gCym7noyDKIOo1C3uElN17y2kv296/lBc65/ikMB9ciV9O23aTbCwbBJuA2CFvQI2cJd3f0bRgleQKWU6NGYdBibGlGgXLufOuDC8pW9IZHzuoqOQmtpuJ1/DWMVPICu2OQtiw/yoslcasZeoqJcW5uZlryLty4wqzo9gKVbIFds+lFU5YAHN+mAqNGeYrx2gTAvXK7A5dYtCt+SOG0J48u3wcXBIDwcHz90Dv+3I5jh7wmb8geCclHckxOyBkZEeYNvHMv9ib+of/N/+6n21LfazWvyH/hL/8CRMjSKA=</latexit>x
M
m=1
$$x^m_{t+1} = \begin{cases} \hat{x}_{t+1}, & \text{if } t \bmod H = 0, \\ x^m_t - \gamma \nabla f_m(x^m_t; \xi^m_t), & \text{otherwise.} \end{cases}$$
<latexit sha1_base64="TU3D7h/GIHQvE30NZkRDc74gSRE=">ACenicbVHbatAEF2pt9S9ueljKQwxbROSGCkNJBACoX3JYwp1ErBcsVqN7CW7K7E7Sm2EP6K/lrd+SV/60LWtQpt0YOHMOXPbmaxS0lEU/QjCe/cfPHy09rjz5Omz5y+6L9fPXVlbgQNRqtJeZtyhkgYHJEnhZWR60zhRXb1aFfXKN1sjRfaFbhSPOxkYUnDyVdr9P04a24/lXDceQZDiWphG+npt3kgknaOWdhHBKjSxgDgQrB3SZe/f0OEoS6ExT8jV2IRlzrTkhmeKQ5HqzaVyBMlULsDWzp/0kiZov0mH4Huhydu+abcX9aOlwV0Qt6DHWjtLuzdJXopaoyGhuHPDOKpo1HBLUij0tWuHFRdXfIxDw3X6EbNcnVzeOuZHIrS+mcIluzfGQ3Xzs105iM1p4m7rS3I/2nDmorDUSNVRMasWpU1AqohMUdIJcWBamZB1xY6WcFMeGWC/LX6vglxLe/fBec7/XjD/29z/u9k4/tOtbYa7bBNlnMDtgJO2VnbMAE+xm8Cd4F74Nf4Ua4FW6vQsOgzXnF/rFw/zcCfb63</latexit>t+1 = xm t γrfm(xm t )
<latexit sha1_base64="/Ss/hIUrOmuSuaZw6WP6qfoGsY=">ACFXicbVBNSwMxEM36WetX1aOXYBEUteyqoBeh6MWjglWhrctsmq2hSXZJZsWy9E948a948aCIV8Gb/8a09uDXg2Ee782QzItSKSz6/oc3Mjo2PjFZmCpOz8zOzZcWFs9tkhnGayRibmMwHIpNK+hQMkvU8NBRZJfRJ2jvn9xw40ViT7DbsqbCtpaxIBOiksbd6GOW4EvStFD+htiK5v0UYblALa0BJoHGo1gbOelgq+xV/APqXBENSJkOchKX3RithmeIamQRr64GfYjMHg4J3is2MstTYB1o87qjGhS3zXxwVY+uOqVF48S40kgH6veNHJS1XRW5SQV4bX97fE/r5hvN/MhU4z5Jp9PRnkmJC+xHRljCcoew6AswI91fKrsEAQxdk0YUQ/D75LznfrgQ7le3T3XL1cBhHgSyTFbJGArJHquSYnJAaYeSOPJAn8uzde4/ei/f6NTriDXeWyA94b5/fPZ1j</latexit>f def
M
m=1
t+1 = xm t γrfm(xm t )
<latexit sha1_base64="/Ss/hIUrOmuSuaZw6WP6qfoGsY=">ACFXicbVBNSwMxEM36WetX1aOXYBEUteyqoBeh6MWjglWhrctsmq2hSXZJZsWy9E948a948aCIV8Gb/8a09uDXg2Ee782QzItSKSz6/oc3Mjo2PjFZmCpOz8zOzZcWFs9tkhnGayRibmMwHIpNK+hQMkvU8NBRZJfRJ2jvn9xw40ViT7DbsqbCtpaxIBOiksbd6GOW4EvStFD+htiK5v0UYblALa0BJoHGo1gbOelgq+xV/APqXBENSJkOchKX3RithmeIamQRr64GfYjMHg4J3is2MstTYB1o87qjGhS3zXxwVY+uOqVF48S40kgH6veNHJS1XRW5SQV4bX97fE/r5hvN/MhU4z5Jp9PRnkmJC+xHRljCcoew6AswI91fKrsEAQxdk0YUQ/D75LznfrgQ7le3T3XL1cBhHgSyTFbJGArJHquSYnJAaYeSOPJAn8uzde4/ei/f6NTriDXeWyA94b5/fPZ1j</latexit>t+1 = xm t γrfm(xm t )
<latexit sha1_base64="/Ss/hIUrOmuSuaZw6WP6qfoGsY=">ACFXicbVBNSwMxEM36WetX1aOXYBEUteyqoBeh6MWjglWhrctsmq2hSXZJZsWy9E948a948aCIV8Gb/8a09uDXg2Ee782QzItSKSz6/oc3Mjo2PjFZmCpOz8zOzZcWFs9tkhnGayRibmMwHIpNK+hQMkvU8NBRZJfRJ2jvn9xw40ViT7DbsqbCtpaxIBOiksbd6GOW4EvStFD+htiK5v0UYblALa0BJoHGo1gbOelgq+xV/APqXBENSJkOchKX3RithmeIamQRr64GfYjMHg4J3is2MstTYB1o87qjGhS3zXxwVY+uOqVF48S40kgH6veNHJS1XRW5SQV4bX97fE/r5hvN/MhU4z5Jp9PRnkmJC+xHRljCcoew6AswI91fKrsEAQxdk0YUQ/D75LznfrgQ7le3T3XL1cBhHgSyTFbJGArJHquSYnJAaYeSOPJAn8uzde4/ei/f6NTriDXeWyA94b5/fPZ1j</latexit>def
M
m=1
t
<latexit sha1_base64="lsPe/03Qr5ovpF4QY82tokgmabo=">ACJ3icbVBS9xAGJ1Ybe2q7VqPvQwugqclWQV7UcRevAgWuipsmEy+2V3cCYJM1+Ky5B/46V/pZeCiuix/6STNQdfTDweO9fPO9pJDCoO8/egvFpfef1j+2FpZXfv0ub3+5czkpebQ57nM9UXCDEiRQR8FSrgoNDCVSDhPLr/X/vkv0Ebk2U+cFhApNs5EKjhDJ8Xtg3DCkF7FSMO8zgHaEOEK7QjSqrL7FQ1TzbgNKntShaZUsVX7QTU8qWeGKm53/K4/A31NgoZ0SIPTuH0TjnJeKsiQS2bMIPALjCzTKLiEqhWBgrGL9kYBo5mTIGJ7OzOim45ZUTXLuXIZ2pzycsU8ZMVeKSiuHEzHu1+JY3KDH9FlmRFSVCxp8WpaWkmNO6NDoSGjKqSOMa+H+SvmEuV7QVdZyJQTzJ78mZ71usNPt/djtHB41dSyTr2STbJOA7JFDckxOSZ9wck3+kFty5/32/nr3sNTdMFrZjbIC3j/gNAc6di</latexit>t+1 = xm t γrfm(xm t )
<latexit sha1_base64="/Ss/hIUrOmuSuaZw6WP6qfoGsY=">ACFXicbVBNSwMxEM36WetX1aOXYBEUteyqoBeh6MWjglWhrctsmq2hSXZJZsWy9E948a948aCIV8Gb/8a09uDXg2Ee782QzItSKSz6/oc3Mjo2PjFZmCpOz8zOzZcWFs9tkhnGayRibmMwHIpNK+hQMkvU8NBRZJfRJ2jvn9xw40ViT7DbsqbCtpaxIBOiksbd6GOW4EvStFD+htiK5v0UYblALa0BJoHGo1gbOelgq+xV/APqXBENSJkOchKX3RithmeIamQRr64GfYjMHg4J3is2MstTYB1o87qjGhS3zXxwVY+uOqVF48S40kgH6veNHJS1XRW5SQV4bX97fE/r5hvN/MhU4z5Jp9PRnkmJC+xHRljCcoew6AswI91fKrsEAQxdk0YUQ/D75LznfrgQ7le3T3XL1cBhHgSyTFbJGArJHquSYnJAaYeSOPJAn8uzde4/ei/f6NTriDXeWyA94b5/fPZ1j</latexit>def
M
m=1
t ˆ
def
M
m=1
t
<latexit sha1_base64="lsPe/03Qr5ovpF4QY82tokgmabo=">ACJ3icbVBS9xAGJ1Ybe2q7VqPvQwugqclWQV7UcRevAgWuipsmEy+2V3cCYJM1+Ky5B/46V/pZeCiuix/6STNQdfTDweO9fPO9pJDCoO8/egvFpfef1j+2FpZXfv0ub3+5czkpebQ57nM9UXCDEiRQR8FSrgoNDCVSDhPLr/X/vkv0Ebk2U+cFhApNs5EKjhDJ8Xtg3DCkF7FSMO8zgHaEOEK7QjSqrL7FQ1TzbgNKntShaZUsVX7QTU8qWeGKm53/K4/A31NgoZ0SIPTuH0TjnJeKsiQS2bMIPALjCzTKLiEqhWBgrGL9kYBo5mTIGJ7OzOim45ZUTXLuXIZ2pzycsU8ZMVeKSiuHEzHu1+JY3KDH9FlmRFSVCxp8WpaWkmNO6NDoSGjKqSOMa+H+SvmEuV7QVdZyJQTzJ78mZ71usNPt/djtHB41dSyTr2STbJOA7JFDckxOSZ9wck3+kFty5/32/nr3sNTdMFrZjbIC3j/gNAc6di</latexit>def
M
m=1
t )
<latexit sha1_base64="u6d56ApFiGX4woHMZucYOmcywxk=">ACLnicbVBNSyQxFEyr6+qsq7N69BIcFvQydKvgXgRBC+CgqPC9NikM6/HYJukteLQ+hf5MW/ogdBRbz6M8yMc/CrIFBU1ePlVpIYTEM74Ox8Ykfkz+npmu/Zn7PztX/zB/bvDQcWjyXuTlNmQUpNLRQoITwgBTqYST9GJn4J/8B2NFro+wX0BHsZ4WmeAMvZTUd3sJ0jgfRABdjHCJrgtZVbnNisaZYdxFlduvYluqxKnNqDrbp7FmqWQ0S9TyZYJnaiWpN8JmOAT9SqIRaZARDpL6bdzNealAI5fM2nYUFthxzKDgEqpaXFoGL9gPWh7qpkC23HDcyv61ytdmuXGP410qL6fcExZ21epTyqG5/azNxC/89olZv86TuiRND8bVFWSo5HXRHu8IAR9n3hHEj/F8pP2e+I/T1XwJ0eTv5Lj1Wa01lw9XG9sbY/qmCKLZIksk4hskC2yRw5Ii3ByRW7IA3kMroO74Cl4fouOBaOZBfIBwcsrVTCp2w=</latexit>Choose H such that H
$\le \sqrt{T}/\sqrt{M}$, then $\gamma = \frac{\sqrt{M}}{4L\sqrt{T}} \le \frac{1}{4HL}$, and hence
$$f(\hat{x}_T) - f(x^*) \le \frac{8L\|x_0 - x^*\|^2}{\sqrt{MT}} + \frac{3M\sigma_f^2 H^2}{2LT}.$$
To get a convergence rate of $1/\sqrt{MT}$ we can choose $H = O(T^{1/4} M^{-3/4})$, which implies a total number of $\Omega(T^{3/4} M^{3/4})$ communication steps. If a rate of $1/\sqrt{T}$ is desired instead, we can choose a larger $H = O(T^{1/4})$.
<latexit sha1_base64="YC/RF8b/Ff3DJwq81jzCNEnsZsg=">AECnicbVNLb9NAEHYTHiW8WjhyGVGDGmjTOKlEL5UqeglSqxYpfUh1Eq3XY2dV7zr1rmkq12cu/BUuHECIK7+AG/+GcWJVbcpIlsYz38x8+2uN4qENs3m37lK9c7de/fnH9QePnr85OnC4rNDHacJxwMeR3Fy7DGNkVB4YISJ8HiUIJNehEfe6XaRP/qEiRax6pqLEfYkC5UIBGeGQoPFCrgGxybHsaxRsjtjg065UMwQ2bA7oAb4Rm4QcJ45uqzxGTdPC+93Ty3VwiICmw3ZFIy2LwBJUC2DjtwVXi9m1PkOrBT9GDKB2rDEWpA5noYCpWxSITqT4JFRYsu0QqG+eDbh1W6Xc8eFOH19d6bhTDLseDJqUp6V72W1dkoZj/tgS2YZdYiVCyQdBvQafAtai4mzemDFD5N+Z3YwjRAMeK9IznJBNmEGIA7CdtXJIN7fhHIEzBXyqKEm4CXvL3X7mrK3nsNvPVtvk1Gnr86EgoYWkc0ZNrU1sWAQqlR4mk7bunsSQFbXtsnZaSiSkTFV5iKANjnQDPgTU4xalgpHQ4KMWCfogFKGZvzLDkHEaKlkhm7dbtQGC0vNRnNicNtxSmfJKm1/sPDH9WOeSlSGR0zrE6c5Mr2MJUbwCPOam2ocMX7KQjwhVzGJupdNrnIOryjiQxAn9CkDk+j1ioxJrS+kR0jJzFDP5org/3InqQk2eplQo9TQ2U0HBWlEokPxLsAnebiJLshPBHElbRhdFcMvZ5CBGd25dvOYavhtButj62lrfelHPWC+ultWw51jtry+pY+9aBxSufK18r3ys/ql+q36o/q7+m0MpcWfPcumHV3/8A25xABA=</latexit>t+1 = xm t γrfm(xm t ; ξm t )
<latexit sha1_base64="WcKtcLHGZxiDYbIuisgnoie8vI=">ACHnicbZBdaxNBFIZno7Yx1natl94MhkKGHbTFoVSCHrjZQrNB2TjcnYymwyZmV1mzkrCkl/iTf+KN14oInil/8bJx4WmPTDMw/uew8x5k1wKi0Hwx6s8ePhob7/6uPbk4Onhkf/suGezwjDeZnMzCABy6XQvIsCJR/khoNKJO8ns/crv/+JGysyfYOLnI8UTLRIBQN0UuxfzOMSX4XLj4pe0XmM7n5NowkoBTSkEigawa+eSRnOxgtPYrwfNYF30LoRbqJNtdWL/VzTOWKG4RibB2mEY5DgqwaBgki9rUWF5DmwGEz50qEFxOyrX6y3piVPGNM2MOxrpWv13ogRl7UIlrlMBTu2utxLv84YFpm9HpdB5gVyzUNpISlmdJUVHQvDGcqFA2BGuL9SNgUDF2iNRdCuLvyXei1muFZs3V9Xm+/28ZRJS/IS9IgIXlD2uQD6ZAuYeQz+UK+ke/erfV+H93LRWvO3Mc/Jfeb/AqHoPM=</latexit>Eξkrfm(x; ξ) rfm(x)k2 4LDfm(x, x∗) + 2σ2
<latexit sha1_base64="ckeNncuaFw0mul06bUCt3lbTM=">ACQ3icbZBNTxsxEIa9QCkNX6E9jIiQkpKG+1ukajUC+qH1AMHKjWAiMNq1vEGC9u7sr0o0ZL/1kv/QG/9A730KrioQTcqDQV7L06pkZjedNCymsC8Mfwdz8wqPFx0tPasrq2vr9Y2nhzYvDeMdlsvcHKdouRSad5xwkh8XhqNKJT9Kz9P6kcX3FiR6y9uVPCewoEWmWDoPErqJ1ShO0vT6uM4oUMB9JqTCVClqjm8C141oJXcBe26OVpDFRy2NmHD0nl4bg5fAnD5EULtiGmVgwUnsZJvRG2w6ngoYlmpkFmOkjq32k/Z6Xi2jGJ1najsHC9Co0TPJxjZaWF8jOcC73mpU3PaqaQZj2PKkD1lu/NMOpvTuRIXK2pFKfefkYnu/NoH/q3VLl73pVUIXpeOa3S7KSgkuh0mg0BeGMydH3iAzwv8V2BkaZM7HXvMhRPdPfmgO43b0uh1/3mnsvZvFsUSek03SJBHZJXvkEzkgHcLIV/KT/CZ/gm/Br+BvcHXbOhfMZp6RfxRc3wC4G62v</latexit>t+1 = xm t γrfm(xm t ; ξm t )
<latexit sha1_base64="WcKtcLHGZxiDYbIuisgnoie8vI=">ACHnicbZBdaxNBFIZno7Yx1natl94MhkKGHbTFoVSCHrjZQrNB2TjcnYymwyZmV1mzkrCkl/iTf+KN14oInil/8bJx4WmPTDMw/uew8x5k1wKi0Hwx6s8ePhob7/6uPbk4Onhkf/suGezwjDeZnMzCABy6XQvIsCJR/khoNKJO8ns/crv/+JGysyfYOLnI8UTLRIBQN0UuxfzOMSX4XLj4pe0XmM7n5NowkoBTSkEigawa+eSRnOxgtPYrwfNYF30LoRbqJNtdWL/VzTOWKG4RibB2mEY5DgqwaBgki9rUWF5DmwGEz50qEFxOyrX6y3piVPGNM2MOxrpWv13ogRl7UIlrlMBTu2utxLv84YFpm9HpdB5gVyzUNpISlmdJUVHQvDGcqFA2BGuL9SNgUDF2iNRdCuLvyXei1muFZs3V9Xm+/28ZRJS/IS9IgIXlD2uQD6ZAuYeQz+UK+ke/erfV+H93LRWvO3Mc/Jfeb/AqHoPM=</latexit>Eξkrfm(x; ξ) rfm(x)k2 4LDfm(x, x∗) + 2σ2
<latexit sha1_base64="ckeNncuaFw0mul06bUCt3lbTM=">ACQ3icbZBNTxsxEIa9QCkNX6E9jIiQkpKG+1ukajUC+qH1AMHKjWAiMNq1vEGC9u7sr0o0ZL/1kv/QG/9A730KrioQTcqDQV7L06pkZjedNCymsC8Mfwdz8wqPFx0tPasrq2vr9Y2nhzYvDeMdlsvcHKdouRSad5xwkh8XhqNKJT9Kz9P6kcX3FiR6y9uVPCewoEWmWDoPErqJ1ShO0vT6uM4oUMB9JqTCVClqjm8C141oJXcBe26OVpDFRy2NmHD0nl4bg5fAnD5EULtiGmVgwUnsZJvRG2w6ngoYlmpkFmOkjq32k/Z6Xi2jGJ1najsHC9Co0TPJxjZaWF8jOcC73mpU3PaqaQZj2PKkD1lu/NMOpvTuRIXK2pFKfefkYnu/NoH/q3VLl73pVUIXpeOa3S7KSgkuh0mg0BeGMydH3iAzwv8V2BkaZM7HXvMhRPdPfmgO43b0uh1/3mnsvZvFsUSek03SJBHZJXvkEzkgHcLIV/KT/CZ/gm/Br+BvcHXbOhfMZp6RfxRc3wC4G62v</latexit>def
M
m=1
t+1 = xm t γrfm(xm t ; ξm t )
<latexit sha1_base64="WcKtcLHGZxiDYbIuisgnoie8vI=">ACHnicbZBdaxNBFIZno7Yx1natl94MhkKGHbTFoVSCHrjZQrNB2TjcnYymwyZmV1mzkrCkl/iTf+KN14oInil/8bJx4WmPTDMw/uew8x5k1wKi0Hwx6s8ePhob7/6uPbk4Onhkf/suGezwjDeZnMzCABy6XQvIsCJR/khoNKJO8ns/crv/+JGysyfYOLnI8UTLRIBQN0UuxfzOMSX4XLj4pe0XmM7n5NowkoBTSkEigawa+eSRnOxgtPYrwfNYF30LoRbqJNtdWL/VzTOWKG4RibB2mEY5DgqwaBgki9rUWF5DmwGEz50qEFxOyrX6y3piVPGNM2MOxrpWv13ogRl7UIlrlMBTu2utxLv84YFpm9HpdB5gVyzUNpISlmdJUVHQvDGcqFA2BGuL9SNgUDF2iNRdCuLvyXei1muFZs3V9Xm+/28ZRJS/IS9IgIXlD2uQD6ZAuYeQz+UK+ke/erfV+H93LRWvO3Mc/Jfeb/AqHoPM=</latexit>Eξkrfm(x; ξ) rfm(x)k2 4LDfm(x, x∗) + 2σ2
<latexit sha1_base64="ckeNncuaFw0mul06bUCt3lbTM=">ACQ3icbZBNTxsxEIa9QCkNX6E9jIiQkpKG+1ukajUC+qH1AMHKjWAiMNq1vEGC9u7sr0o0ZL/1kv/QG/9A730KrioQTcqDQV7L06pkZjedNCymsC8Mfwdz8wqPFx0tPasrq2vr9Y2nhzYvDeMdlsvcHKdouRSad5xwkh8XhqNKJT9Kz9P6kcX3FiR6y9uVPCewoEWmWDoPErqJ1ShO0vT6uM4oUMB9JqTCVClqjm8C141oJXcBe26OVpDFRy2NmHD0nl4bg5fAnD5EULtiGmVgwUnsZJvRG2w6ngoYlmpkFmOkjq32k/Z6Xi2jGJ1najsHC9Co0TPJxjZaWF8jOcC73mpU3PaqaQZj2PKkD1lu/NMOpvTuRIXK2pFKfefkYnu/NoH/q3VLl73pVUIXpeOa3S7KSgkuh0mg0BeGMydH3iAzwv8V2BkaZM7HXvMhRPdPfmgO43b0uh1/3mnsvZvFsUSek03SJBHZJXvkEzkgHcLIV/KT/CZ/gm/Br+BvcHXbOhfMZp6RfxRc3wC4G62v</latexit>def
M
m=1
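Choose $H$ such that $H \le \sqrt{T}/\sqrt{M}$, then $\gamma = \frac{\sqrt{M}}{8L\sqrt{T}} \le \frac{1}{8HL}$ and
$$\mathbb{E} f(\hat{x}_T) - f(x^*) \le \frac{32L\|\hat{x}_0 - x^*\|^2}{\sqrt{MT}} + \frac{5\sigma_{\mathrm{dif}}^2}{2L\sqrt{MT}} + \frac{\sigma_{\mathrm{dif}}^2 M (H-1)^2}{4LT}.$$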
<latexit sha1_base64="DjE2je4R90UfzEDskAkE7Lisr2E=">ADNHicdVJbaxNBFJ5dbzXeUn305WBWSNSG3a1iX4RiEYI0UCFpC9m4zM7OJkP31p1ZaZjOj/LFH+KLCD4o4qu/wdlkDUmrBwa+Oef7zm0myGPGhW1/NcwrV69dv7Fxs3Hr9p2795qb9w95VhaEDkWZ8VxgDmNWUqHgomYHucFxUkQ06PgZK+KH32gBWdZOhCznI4TPElZxAgW2uVvGm/3plnGKVg9C3hJpiCmWOgbeDE9BS8qMJEePy2EHChVo75S1jNpClY3gQnCYZXa1RNkDuwD0vhajanivVgX1mA0xA8rwHaLC/BYhoE8o2SEbQ93YU8U/6gA1ug72f+k85alm23yn/+l2drmuZ45+/dZdQFX5a81/oZtgkwb6cFyoSGbJIqYruLjvtryr+w4c+tHtbTqdSPtfKgeouBmj4zZbdtecGl4FTgxaq7cBvfvbCjJQJTQWJMecjx87FWOJCMBJT1fBKTnNMTvCEjRMcUL5WM4fXcFj7Qkhygp9UgFz76pC4oTzWRJoZjUAvxirnP+KjUoR7YwlS/NS0JQsCkVlDCKD6gdByApKRDzTAJOC6V6BTLHemND/rFqCc3Hky+DQ7TrbXfed29p9Xa9jAz1Ej1AbOegl2kU9dICGiBgfjS/Gd+OH+cn8Zv40fy2oplFrHqA1M3/AXKwAGE=</latexit>Choose H such that H ≤
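$\sqrt{T}/\sqrt{M}$, then $\gamma = \frac{\sqrt{M}}{8L\sqrt{T}} \le \frac{1}{8HL}$ and
$$\mathbb{E} f(\hat{x}_T) - f(x^*) \le \frac{32L\|\hat{x}_0 - x^*\|^2}{\sqrt{MT}} + \frac{5\sigma_{\mathrm{dif}}^2}{2L\sqrt{MT}} + \frac{\sigma_{\mathrm{dif}}^2 M (H-1)^2}{4LT}.$$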
<latexit sha1_base64="DjE2je4R90UfzEDskAkE7Lisr2E=">ADNHicdVJbaxNBFJ5dbzXeUn305WBWSNSG3a1iX4RiEYI0UCFpC9m4zM7OJkP31p1ZaZjOj/LFH+KLCD4o4qu/wdlkDUmrBwa+Oef7zm0myGPGhW1/NcwrV69dv7Fxs3Hr9p2795qb9w95VhaEDkWZ8VxgDmNWUqHgomYHucFxUkQ06PgZK+KH32gBWdZOhCznI4TPElZxAgW2uVvGm/3plnGKVg9C3hJpiCmWOgbeDE9BS8qMJEePy2EHChVo75S1jNpClY3gQnCYZXa1RNkDuwD0vhajanivVgX1mA0xA8rwHaLC/BYhoE8o2SEbQ93YU8U/6gA1ug72f+k85alm23yn/+l2drmuZ45+/dZdQFX5a81/oZtgkwb6cFyoSGbJIqYruLjvtryr+w4c+tHtbTqdSPtfKgeouBmj4zZbdtecGl4FTgxaq7cBvfvbCjJQJTQWJMecjx87FWOJCMBJT1fBKTnNMTvCEjRMcUL5WM4fXcFj7Qkhygp9UgFz76pC4oTzWRJoZjUAvxirnP+KjUoR7YwlS/NS0JQsCkVlDCKD6gdByApKRDzTAJOC6V6BTLHemND/rFqCc3Hky+DQ7TrbXfed29p9Xa9jAz1Ej1AbOegl2kU9dICGiBgfjS/Gd+OH+cn8Zv40fy2oplFrHqA1M3/AXKwAGE=</latexit>Choose H such that H ≤
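$\sqrt{T}/\sqrt{M}$, then $\gamma = \frac{\sqrt{M}}{8L\sqrt{T}} \le \frac{1}{8HL}$ and
$$\mathbb{E} f(\hat{x}_T) - f(x^*) \le \frac{32L\|\hat{x}_0 - x^*\|^2}{\sqrt{MT}} + \frac{5\sigma_{\mathrm{dif}}^2}{2L\sqrt{MT}} + \frac{\sigma_{\mathrm{dif}}^2 M (H-1)^2}{4LT}.$$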
<latexit sha1_base64="DjE2je4R90UfzEDskAkE7Lisr2E=">ADNHicdVJbaxNBFJ5dbzXeUn305WBWSNSG3a1iX4RiEYI0UCFpC9m4zM7OJkP31p1ZaZjOj/LFH+KLCD4o4qu/wdlkDUmrBwa+Oef7zm0myGPGhW1/NcwrV69dv7Fxs3Hr9p2795qb9w95VhaEDkWZ8VxgDmNWUqHgomYHucFxUkQ06PgZK+KH32gBWdZOhCznI4TPElZxAgW2uVvGm/3plnGKVg9C3hJpiCmWOgbeDE9BS8qMJEePy2EHChVo75S1jNpClY3gQnCYZXa1RNkDuwD0vhajanivVgX1mA0xA8rwHaLC/BYhoE8o2SEbQ93YU8U/6gA1ug72f+k85alm23yn/+l2drmuZ45+/dZdQFX5a81/oZtgkwb6cFyoSGbJIqYruLjvtryr+w4c+tHtbTqdSPtfKgeouBmj4zZbdtecGl4FTgxaq7cBvfvbCjJQJTQWJMecjx87FWOJCMBJT1fBKTnNMTvCEjRMcUL5WM4fXcFj7Qkhygp9UgFz76pC4oTzWRJoZjUAvxirnP+KjUoR7YwlS/NS0JQsCkVlDCKD6gdByApKRDzTAJOC6V6BTLHemND/rFqCc3Hky+DQ7TrbXfed29p9Xa9jAz1Ej1AbOegl2kU9dICGiBgfjS/Gd+OH+cn8Zv40fy2oplFrHqA1M3/AXKwAGE=</latexit>x
M
m=1
Better Communication Complexity for Local SGD, arXiv:1909.04746
First Analysis of Local GD on Heterogeneous Data, arXiv:1909.04715
NeurIPS workshop on Federated Learning: http://federated-learning.org/fl-neurips-2019/