<html><head></head><body style="word-wrap: break-word; -webkit-nbsp-mode: space; -webkit-line-break: after-white-space; ">OK here are some more numbers for the latest patch in gerrit. I will follow Ruperts format as it's the most clear.<div><br></div><div>MeanSquares:</div><div><div>Threads<span class="Apple-tab-span" style="white-space: pre; ">        </span>3.2<span class="Apple-tab-span" style="white-space: pre; ">                </span>4.2<span class="Apple-tab-span" style="white-space: pre; ">                </span>4.2+patch<span class="Apple-tab-span" style="white-space: pre; ">        </span>patch percentage of 3.20</div><div>1<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.3615<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.8214<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.4071<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>113%</div><div>2<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.3222<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.6055<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.3365<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>104%</div><div>4<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.3249<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.4448<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.3293<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        
</span>101%</div><div>8<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1703<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.3093<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1943<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>114%</div><div>12<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1457<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.2031<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1322<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>91%</div><div>24*<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1062<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1332<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.0949<span class="Apple-tab-span" style="white-space: pre; ">                </span>89%</div></div><div><br></div><div>MutualInformation:</div><div><div><div>Threads<span class="Apple-tab-span" style="white-space: pre; ">        </span>3.2<span class="Apple-tab-span" style="white-space: pre; ">                </span>4.2<span class="Apple-tab-span" style="white-space: pre; ">                </span>4.2+patch<span class="Apple-tab-span" style="white-space: pre; ">        </span>patch percentage of 3.20</div><div>1<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1467<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.6103<span 
class="Apple-tab-span" style="white-space: pre; ">        </span>0.3353<span class="Apple-tab-span" style="white-space: pre; ">                </span>228%</div><div>2<span class="Apple-tab-span" style="white-space: pre; ">                </span>0.1036<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.3747<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1774<span class="Apple-tab-span" style="white-space: pre; ">                </span>171%</div><div>4<span class="Apple-tab-span" style="white-space: pre; ">                </span>0.0847<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.2175<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1262<span class="Apple-tab-span" style="white-space: pre; ">                </span>149%</div><div>8<span class="Apple-tab-span" style="white-space: pre; ">                </span>0.0655<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1291<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.0681<span class="Apple-tab-span" style="white-space: pre; ">                </span>104%</div><div>12<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.0551<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.1035<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.0486<span class="Apple-tab-span" style="white-space: pre; ">                </span>88%</div><div>24*<span class="Apple-tab-span" style="white-space: pre; ">        </span><span class="Apple-tab-span" style="white-space: pre; ">        </span>0.0460<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.0829<span class="Apple-tab-span" style="white-space: pre; ">        </span>0.0526<span class="Apple-tab-span" style="white-space: pre; ">                
</span>114%</div></div></div><div><br></div><div>*Hyperthreading</div><div><div><br></div><div>The observation to be made about MutualInformation is that while 4.2 is still slower with one thread, there is a significant increase in speed-up due to threads now.</div><div><br></div><div>Brad</div></div><div><br></div><div><div>On Jul 26, 2012, at 2:02 PM, Rupert Brooks wrote:</div><br class="Apple-interchange-newline"><blockquote type="cite">Ok that makes way more sense, sorry I didn't understand first time around.<div><br></div><div>Just so I've got it right<div>Threads &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;3.20 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;4.2+patch &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;Time 4.2 as percent of 3.20</div>
<div><div>1 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; 0.347567 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;0.383342 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;110.293%</div><div>2 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; 0.300869 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;0.335328 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;111.453</div><div>4 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; 0.348677 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;0.315688 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; 90.5388</div>
<div>8 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; 0.182681 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;0.192132 &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;105.173</div></div><div><br></div><div>So there's about 10% more time with ITK 4.2 used in the 1 and 2 thread case. &nbsp;That is definitely better than what we were getting. &nbsp;Cool.</div>
<div><br></div><div>Rupert</div><div><br></div><div>--------------------------------------------------------------<br>Rupert Brooks<br><a href="mailto:rupert.brooks@gmail.com">rupert.brooks@gmail.com</a><br><br>
<br><br><div class="gmail_quote">On Thu, Jul 26, 2012 at 1:13 PM, Bradley Lowekamp <span dir="ltr">&lt;<a href="mailto:blowekamp@mail.nih.gov" target="_blank">blowekamp@mail.nih.gov</a>&gt;</span> wrote:<br><blockquote class="gmail_quote" style="margin-top: 0px; margin-right: 0px; margin-bottom: 0px; margin-left: 0.8ex; border-left-width: 1px; border-left-color: rgb(204, 204, 204); border-left-style: solid; padding-left: 1ex; position: static; z-index: auto; ">
<div style="word-wrap:break-word">Sorry for not being clear! I got too excited by finding the solution to the performance issue with ITKv3 registration in ITKv4.<div><br></div><div>The first is vanilla 3.20, the second is 4.2 + the gerrit patch. The third is the gerrit patch with the pre-malloc of the Jacobian outside the threaded section!&nbsp;Vanilla 4.2 is ~2x 3.20 for this test on my system too.<div>
<br></div><div>Summary for the MeanSquares metric in your test:</div><div><br></div><div>3.20: &nbsp;1X</div><div>4.2: 2+X</div><div>4.2+gerrit patch: 1X</div><div>4.2+gerrit patch + single-threaded preallocation of jacobian: 1.5X<br>
</div></div></div></blockquote></div></div></div></blockquote></div><br><div>
<span class="Apple-style-span" style="border-collapse: separate; color: rgb(0, 0, 0); font-family: Helvetica; font-style: normal; font-variant: normal; font-weight: normal; letter-spacing: normal; line-height: normal; orphans: 2; text-align: -webkit-auto; text-indent: 0px; text-transform: none; white-space: normal; widows: 2; word-spacing: 0px; -webkit-border-horizontal-spacing: 0px; -webkit-border-vertical-spacing: 0px; -webkit-text-decorations-in-effect: none; -webkit-text-size-adjust: auto; -webkit-text-stroke-width: 0px; font-size: medium; "><span class="Apple-style-span" style="border-collapse: separate; -webkit-border-horizontal-spacing: 0px; -webkit-border-vertical-spacing: 0px; color: rgb(0, 0, 0); font-family: Helvetica; font-size: 12px; font-style: normal; font-variant: normal; font-weight: normal; letter-spacing: normal; line-height: normal; -webkit-text-decorations-in-effect: none; text-indent: 0px; -webkit-text-size-adjust: auto; text-transform: none; orphans: 2; white-space: normal; widows: 2; word-spacing: 0px; "><div style="word-wrap: break-word; -webkit-nbsp-mode: space; -webkit-line-break: after-white-space; "><span class="Apple-style-span" style="border-collapse: separate; -webkit-border-horizontal-spacing: 0px; -webkit-border-vertical-spacing: 0px; color: rgb(0, 0, 0); font-family: Helvetica; font-size: 12px; font-style: normal; font-variant: normal; font-weight: normal; letter-spacing: normal; line-height: normal; -webkit-text-decorations-in-effect: none; text-indent: 0px; -webkit-text-size-adjust: auto; text-transform: none; orphans: 2; white-space: normal; widows: 2; word-spacing: 0px; "><p style="margin-top: 0px; margin-right: 0px; margin-bottom: 0px; margin-left: 0px; "><font face="Helvetica" size="3" style="font: normal normal normal 12px/normal Helvetica; ">========================================================</font></p><p style="margin-top: 0px; margin-right: 0px; margin-bottom: 0px; margin-left: 0px; "><font face="Helvetica" size="3" 
style="font: normal normal normal 12px/normal Helvetica; ">Bradley Lowekamp<span class="Apple-converted-space">&nbsp;</span><span class="Apple-converted-space">&nbsp;</span></font></p><p style="margin-top: 0px; margin-right: 0px; margin-bottom: 0px; margin-left: 0px; "><font face="Helvetica" size="3" style="font: normal normal normal 12px/normal Helvetica; ">Medical Science and Computing for</font></p><p style="margin-top: 0px; margin-right: 0px; margin-bottom: 0px; margin-left: 0px; "><font face="Helvetica" size="3" style="font: normal normal normal 12px/normal Helvetica; ">Office of High Performance Computing and Communications</font></p><p style="margin-top: 0px; margin-right: 0px; margin-bottom: 0px; margin-left: 0px; "><font face="Helvetica" size="3" style="font: normal normal normal 12px/normal Helvetica; ">National Library of Medicine<span class="Apple-converted-space">&nbsp;</span></font></p><p style="margin-top: 0px; margin-right: 0px; margin-bottom: 0px; margin-left: 0px; "><font face="Helvetica" size="3" style="font: normal normal normal 12px/normal Helvetica; "><a href="mailto:blowekamp@mail.nih.gov">blowekamp@mail.nih.gov</a></font></p><br class="Apple-interchange-newline"></span></div></span></span><br class="Apple-interchange-newline">
</div>
<br></body></html>