# LaTeX2HTML 0.6.4 (Tues Aug 30 1994) # Associate image original text (scrambled) with physical files. $key = q/{figure}centerlinepsfigfigure=.code.eps,width=5.5in,height=3in{figure}/; $cached_env_img{$key} =''; $key = q/{}$infty${}/; $cached_env_img{$key} =''; $key = q/{}$X${}/; $cached_env_img{$key} =''; $key = q/{displaymath}bordermatrix;html_special_mark_amp;k;html_special_mark_amp;n-kcrk;html_special_mark_amp;A_11;html_special_mark_amp;A_12crn-k;html_special_mark_amp;0;html_special_mark_amp;A_22cr,{displaymath}/; $cached_env_img{$key} =''; $key = q/{}$A_22${}/; $cached_env_img{$key} =''; $key = q/{table}centertabular|r|r|r|r||r|r|r|hlinebfDelta;html_special_mark_amp;multicolumn3c||$16times16$PEs;html_special_mark_amp;multicolumn3c|$16times32$PEshline$n$;html_special_mark_amp;QRtime;html_special_mark_amp;Solvetime;html_special_mark_amp;Mflops;html_special_mark_amp;QRtime;html_special_mark_amp;Solvetime;html_special_mark_amp;Mflops;html_special_mark_amp;(seconds);html_special_mark_amp;(seconds);html_special_mark_amp;(total);html_special_mark_amp;(seconds);html_special_mark_amp;(seconds);html_special_mark_amp;(total)hlinehline1000;html_special_mark_amp;4.514;html_special_mark_amp;1.0033;html_special_mark_amp;242.77;html_special_mark_amp;3.440;html_special_mark_amp;0.3975;html_special_mark_amp;348.262000;html_special_mark_amp;11.495;html_special_mark_amp;2.1829;html_special_mark_amp;781.61;html_special_mark_amp;8.381;html_special_mark_amp;0.8433;html_special_mark_amp;1157.633000;html_special_mark_amp;21.791;html_special_mark_amp;3.6266;html_special_mark_amp;1418.44;html_special_mark_amp;15.414;html_special_mark_amp;1.3375;html_special_mark_amp;2150.734000;html_special_mark_amp;36.150;html_special_mark_amp;5.3768;html_special_mark_amp;2057.21;html_special_mark_amp;24.752;html_special_mark_amp;1.8519;html_special_mark_amp;3209.405000;html_special_mark_amp;55.513;html_special_mark_amp;7.2712;html_special_mark_amp;2656.98;html_special_mark_amp;36.911;html_special_mark_amp;2.3994;html_special_mark_amp;4241.716000;html_special_mark_amp;80.682;html_special_mark_amp;9.5162;html_special_mark_amp;3195.36;html_special_mark_amp;52.452;html_special_mark_amp;3.0455;html_special_mark_amp;5191.397000;html_special_mark_amp;112.359;html_special_mark_amp;12.0318;html_special_mark_amp;3678.94;html_special_mark_amp;71.531;html_special_mark_amp;3.6736;html_special_mark_amp;6083.128000;html_special_mark_amp;151.524;html_special_mark_amp;14.7269;html_special_mark_amp;4108.54;html_special_mark_amp;94.682;html_special_mark_amp;4.3310;html_special_mark_amp;6896.669000;html_special_mark_amp;198.830;html_special_mark_amp;17.8164;html_special_mark_amp;4488.82;html_special_mark_amp;122.305;html_special_mark_amp;5.0823;html_special_mark_amp;7632.1810000;html_special_mark_amp;255.710;html_special_mark_amp;20.9755;html_special_mark_amp;4821.16;html_special_mark_amp;154.792;html_special_mark_amp;5.8376;html_special_mark_amp;8302.54hlinetabularvspace.2intabular|r|r|r||r|r|hlinebfDelta;html_special_mark_amp;multicolumn2c||$16times16$PEs;html_special_mark_amp;multicolumn2c|$16times32$PEshline$n$;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;(seconds);html_special_mark_amp;(total);html_special_mark_amp;(seconds);html_special_mark_amp;(total)hlinehline1000;html_special_mark_amp;6.6254;html_special_mark_amp;201.25;html_special_mark_amp;4.6249;html_special_mark_amp;288.292000;html_special_mark_amp;18.1142;html_special_mark_amp;588.86;html_special_mark_amp;11.8456;html_special_mark_amp;900.483000;html_special_mark_amp;35.8709;html_special_mark_amp;1003.60;html_special_mark_amp;22.3526;html_special_mark_amp;1610.554000;html_special_mark_amp;62.3064;html_special_mark_amp;1369.58;html_special_mark_amp;37.2151;html_special_mark_amp;2292.985000;html_special_mark_amp;98.1878;html_special_mark_amp;1697.43;html_special_mark_amp;57.3836;html_special_mark_amp;2904.436000;html_special_mark_amp;147.1279;html_special_mark_amp;1957.48;html_special_mark_amp;83.2704;html_special_mark_amp;3458.617000;html_special_mark_amp;209.4396;html_special_mark_amp;2183.61;html_special_mark_amp;116.7009;html_special_mark_amp;3918.858000;html_special_mark_amp;286.0408;html_special_mark_amp;2386.61;html_special_mark_amp;157.7757;html_special_mark_amp;4326.829000;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;207.2685;html_special_mark_amp;4689.5710000;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;265.6364;html_special_mark_amp;5019.39hlinetabularcenter{table}/; $cached_env_img{$key} =''; $key = q/{}$R${}/; $cached_env_img{$key} =''; $key = q/{}$(B^H_j,-A^H_j)^H${}/; $cached_env_img{$key} =''; $key = q/{}$A-lambdaB${}/; $cached_env_img{$key} =''; $key = q/{table}centerlinetabular|l|c|c|c|c|c|hline;html_special_mark_amp;Computation;html_special_mark_amp;multicolumn2c|CommunicationCost;html_special_mark_amp;multicolumn2c|LoadImbalanceCostcline3-6Task;html_special_mark_amp;Cost;html_special_mark_amp;latency;html_special_mark_amp;bandwidth$^-1$;html_special_mark_amp;computation;html_special_mark_amp;bandwidth$^-1$hlineLU;html_special_mark_amp;$frac23fracn^3ptdgemm$;html_special_mark_amp;$scriptstyle(6+lgp)ntlatency$;html_special_mark_amp;$scriptstyle(3+fraclgp4scriptstyle)fracn^2sqrtptband$;html_special_mark_amp;$fracbn^2sqrtptdgemm$;html_special_mark_amp;$scriptstyle(1+fraclgp4scriptstyle)bntband$hlineTRI;html_special_mark_amp;$frac43fracn^3ptdgemm$;html_special_mark_amp;$scriptstyle2ntlatency$;html_special_mark_amp;$scriptstyle(2+frac32scriptstylelgp)fracn^2sqrtptband$;html_special_mark_amp;$frac2bn^2sqrtptau_ttDGEMM$;html_special_mark_amp;$frac3bnlgp2tband$hlineparbox0.75inMatrixmultiply;html_special_mark_amp;$scriptstyle2fracn^3ptdgemm$;html_special_mark_amp;$scriptstyle(1+fraclgp2scriptstyle)sqrtptlatency$;html_special_mark_amp;$scriptstyle(1+fraclgp2scriptstyle)fracn^2sqrtptband$;html_special_mark_amp;;html_special_mark_amp;hlineQR;html_special_mark_amp;$frac43fracn^3ptdgemm$;html_special_mark_amp;$scriptstyle3nlgptau_lat$;html_special_mark_amp;$frac3lgp4fracn^2sqrtptband$;html_special_mark_amp;;html_special_mark_amp;hlineparbox0.75inHouseholderapplication;html_special_mark_amp;$scriptstyle2fracn^3ptdgemm$;html_special_mark_amp;;html_special_mark_amp;$scriptstyle2fracn^2sqrtpscriptstylelgptband$;html_special_mark_amp;;html_special_mark_amp;hlinetabular{table}/; $cached_env_img{$key} =''; $key = q/{}$(0,I)^T${}/; $cached_env_img{$key} =''; $key = q/{}$rmdet(A-lambdaB)${}/; $cached_env_img{$key} =''; $key = q/{displaymath}mboxrmsign(A)equivXleft(arrayccI;html_special_mark_amp;00;html_special_mark_amp;-Iarrayright)X^-1.{displaymath}/; $cached_env_img{$key} =''; $key = q/{}$n;html_special_mark_lt;512${}/; $cached_env_img{$key} =''; $key = q/{}$R_1${}/; $cached_env_img{$key} =''; $key = q/{}$A_j+1=Q^H_12A_j;${}/; $cached_env_img{$key} =''; $key = q/{table}centertabular|r|r|r||r|r|hlinebfDelta;html_special_mark_amp;multicolumn2c||$16times16$PEs;html_special_mark_amp;multicolumn2c|$16times32$PEshline$n$;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;(seconds);html_special_mark_amp;(total);html_special_mark_amp;(seconds);html_special_mark_amp;(total)hlinehline1000;html_special_mark_amp;0.86;html_special_mark_amp;2314.70;html_special_mark_amp;0.62;html_special_mark_amp;3237.472000;html_special_mark_amp;4.03;html_special_mark_amp;3971.61;html_special_mark_amp;2.57;html_special_mark_amp;6236.893000;html_special_mark_amp;10.57;html_special_mark_amp;5108.06;html_special_mark_amp;6.49;html_special_mark_amp;8320.184000;html_special_mark_amp;21.63;html_special_mark_amp;5918.57;html_special_mark_amp;13.61;html_special_mark_amp;9406.205000;html_special_mark_amp;40.27;html_special_mark_amp;6207.39;html_special_mark_amp;24.54;html_special_mark_amp;10187.366000;html_special_mark_amp;65.80;html_special_mark_amp;6565.66;html_special_mark_amp;39.52;html_special_mark_amp;10930.537000;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;60.43;html_special_mark_amp;11352.038000;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;87.96;html_special_mark_amp;11641.059000;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;126.01;html_special_mark_amp;11570.10hlinetabularvspace.2intabular|r|r|r|r||r|r|r|hlinebfDelta;html_special_mark_amp;multicolumn3c||$16times16$PEs;html_special_mark_amp;multicolumn3c|$16times32$PEshline$n$;html_special_mark_amp;LUtime;html_special_mark_amp;TRItime;html_special_mark_amp;Mflops;html_special_mark_amp;LUtime;html_special_mark_amp;TRItime;html_special_mark_amp;Mflops;html_special_mark_amp;(seconds);html_special_mark_amp;(seconds);html_special_mark_amp;(total);html_special_mark_amp;(seconds);html_special_mark_amp;(seconds);html_special_mark_amp;(total)hlinehline1000;html_special_mark_amp;2.709;html_special_mark_amp;2.821;html_special_mark_amp;361.67;html_special_mark_amp;2.049;html_special_mark_amp;2.419;html_special_mark_amp;447.632000;html_special_mark_amp;6.743;html_special_mark_amp;9.337;html_special_mark_amp;995.01;html_special_mark_amp;4.990;html_special_mark_amp;7.471;html_special_mark_amp;1284.013000;html_special_mark_amp;12.472;html_special_mark_amp;20.460;html_special_mark_amp;1639.76;html_special_mark_amp;8.971;html_special_mark_amp;15.668;html_special_mark_amp;2191.664000;html_special_mark_amp;20.287;html_special_mark_amp;37.164;html_special_mark_amp;2227.98;html_special_mark_amp;14.167;html_special_mark_amp;27.431;html_special_mark_amp;3077.045000;html_special_mark_amp;30.676;html_special_mark_amp;60.773;html_special_mark_amp;2733.78;html_special_mark_amp;20.895;html_special_mark_amp;43.253;html_special_mark_amp;3897.246000;html_special_mark_amp;44.031;html_special_mark_amp;92.136;html_special_mark_amp;3172.57;html_special_mark_amp;29.258;html_special_mark_amp;64.015;html_special_mark_amp;4631.527000;html_special_mark_amp;60.771;html_special_mark_amp;132.391;html_special_mark_amp;3551.41;html_special_mark_amp;39.558;html_special_mark_amp;89.561;html_special_mark_amp;5312.958000;html_special_mark_amp;81.240;html_special_mark_amp;176.255;html_special_mark_amp;3976.78;html_special_mark_amp;51.908;html_special_mark_amp;117.107;html_special_mark_amp;6058.629000;html_special_mark_amp;106.045;html_special_mark_amp;243.910;html_special_mark_amp;4166.25;html_special_mark_amp;66.579;html_special_mark_amp;157.781;html_special_mark_amp;6498.4810000;html_special_mark_amp;135.381;html_special_mark_amp;316.825;html_special_mark_amp;4422.77;html_special_mark_amp;83.737;html_special_mark_amp;202.448;html_special_mark_amp;6988.48hlinetabularcenter{table}/; $cached_env_img{$key} =''; $key = q/{}$tau_lat+dtband${}/; $cached_env_img{$key} =''; $key = q/{}$L${}/; $cached_env_img{$key} =''; $key = q/{}$mu${}/; $cached_env_img{$key} =''; $key = q/{}$rband${}/; $cached_env_img{$key} =''; $key = q/{}$Q_12^HB_j=Q_22^HA_j${}/; $cached_env_img{$key} =''; $key = q/{}$sqrtmboxoverflow${}/; $cached_env_img{$key} =''; $key = q/{figure}centerlinepsfigfigure=.signscale.eps,width=3inlabelsignscalpic{figure}/; $cached_env_img{$key} =''; $key = q/{}$(A_p+B_p)^-1A_p${}/; $cached_env_img{$key} =''; $key = q/{}$10${}/; $cached_env_img{$key} =''; $key = q/{}$I-P_+=P_-=frac12(I-mboxrmsign(A))${}/; $cached_env_img{$key} =''; $key = q/{}$tdgemm${}/; $cached_env_img{$key} =''; $key = q/{}$2ntimesn${}/; $cached_env_img{$key} =''; $key = q/{}$n^3${}/; $cached_env_img{$key} =''; $key = q/{}$lim_jrightarrowinftyA_j=mboxrmsign(A)${}/; $cached_env_img{$key} =''; $key = q/{}$Pi${}/; $cached_env_img{$key} =''; $key = q/{}$A_p${}/; $cached_env_img{$key} =''; $key = q/{figure}centerlinepsfigfigure=.intelblocktime.eps,width=3inpsfigfigure=.intelblockmflops.eps,width=3inlabelintelpic{figure}/; $cached_env_img{$key} =''; $key = q/{}$500times500${}/; $cached_env_img{$key} =''; $key = q/{}$sqrtmboxunderflow${}/; $cached_env_img{$key} =''; $key = q/{}$16times16${}/; $cached_env_img{$key} =''; $key = q/{figure}centerlinepsfigfigure=.allxi.eps,width=5.5in{figure}/; $cached_env_img{$key} =''; $key = q/{}$B_0=I${}/; $cached_env_img{$key} =''; $key = q/{}$2ntimes2n${}/; $cached_env_img{$key} =''; $key = q/{}$(A-I)(A+I)^-1${}/; $cached_env_img{$key} =''; $key = q/{displaymath}bordermatrix;html_special_mark_amp;260;html_special_mark_amp;240cr260;html_special_mark_amp;A_11;html_special_mark_amp;A_12cr240;html_special_mark_amp;0;html_special_mark_amp;A_22cr{displaymath}/; $cached_env_img{$key} =''; $key = q/{}$P_+=QRPi${}/; $cached_env_img{$key} =''; $key = q/{}$(A_p+B_p)^-1${}/; $cached_env_img{$key} =''; $key = q/{}$p=j+1${}/; $cached_env_img{$key} =''; $key = q/{}$(j;html_special_mark_gt;1&|R_j-R_j-1|_1leqtau|R_j-1|_1${}/; $cached_env_img{$key} =''; $key = q/{}$P_+${}/; $cached_env_img{$key} =''; $key = q/{}$|A^2-I|;html_special_mark_lt;1${}/; $cached_env_img{$key} =''; $key = q/{}$tlatency${}/; $cached_env_img{$key} =''; $key = q/{}$|E_21|_1|A|_1${}/; $cached_env_img{$key} =''; $key = q/{figure}centerlinepsfigfigure=.circle1.eps,width=3inlabelfig_region{figure}/; $cached_env_img{$key} =''; $key = q/{}$A_0=A-muI${}/; $cached_env_img{$key} =''; $key = q/{}$ltimesl${}/; $cached_env_img{$key} =''; $key = q/{}$tau${}/; $cached_env_img{$key} =''; $key = q/{}$tband${}/; $cached_env_img{$key} =''; $key = q/{}$k${}/; $cached_env_img{$key} =''; $key = q/{}$[-1,1]${}/; $cached_env_img{$key} =''; $key = q/{}$B_j+1=Q^H_22B_j;${}/; $cached_env_img{$key} =''; $key = q/{}$(mboxrmsign(A))^2=I${}/; $cached_env_img{$key} =''; $key = q/{}$|E_21|_1|A|_1leq10^-11${}/; $cached_env_img{$key} =''; $key = q/{}$times${}/; $cached_env_img{$key} =''; $key = q/{}$A_11${}/; $cached_env_img{$key} =''; $key = q/{}$left(arrayrB_j-A_jarrayright)=left(arrayccQ_11;html_special_mark_amp;Q_12Q_21;html_special_mark_amp;Q_22arrayright)left(arraycR_j0arrayright)${}/; $cached_env_img{$key} =''; $key = q/{}$Q_22${}/; $cached_env_img{$key} =''; $key = q/{}$A_j+1=frac12(A_j+A^-1_j)${}/; $cached_env_img{$key} =''; $key = q/{}$Q_12${}/; $cached_env_img{$key} =''; $key = q/{table}centertabular|r|r|r|r||r|r|r||r|r|r|hlinebfDelta;html_special_mark_amp;multicolumn3c||$8times16$PEs;html_special_mark_amp;multicolumn3c||$16times16$PEs;html_special_mark_amp;multicolumn3c|$16times32$PEshline$n$;html_special_mark_amp;iter;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;iter;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;iter;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;;html_special_mark_amp;(sec);html_special_mark_amp;(total);html_special_mark_amp;;html_special_mark_amp;(sec);html_special_mark_amp;(total);html_special_mark_amp;;html_special_mark_amp;(sec);html_special_mark_amp;(total)hlinehline1000;html_special_mark_amp;;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;18;html_special_mark_amp;134.21;html_special_mark_amp;293.05;html_special_mark_amp;19;html_special_mark_amp;110.83;html_special_mark_amp;372.942000;html_special_mark_amp;21;html_special_mark_amp;502.57;html_special_mark_amp;678.43;html_special_mark_amp;21;html_special_mark_amp;448.69;html_special_mark_amp;808.28;html_special_mark_amp;21;html_special_mark_amp;336.34;html_special_mark_amp;1978.273000;html_special_mark_amp;18;html_special_mark_amp;1037.03;html_special_mark_amp;1024.07;html_special_mark_amp;18;html_special_mark_amp;792.18;html_special_mark_amp;1340.60;html_special_mark_amp;18;html_special_mark_amp;576.68;html_special_mark_amp;1841.554000;html_special_mark_amp;;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;19;html_special_mark_amp;1436.13;html_special_mark_amp;1841.98;html_special_mark_amp;19;html_special_mark_amp;1014.63;html_special_mark_amp;2607.188000;html_special_mark_amp;;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;20;html_special_mark_amp;4268.35;html_special_mark_amp;5197.94hlinetabular~tabular|r|r|r||r|r||r|r|hlinebfDelta;html_special_mark_amp;multicolumn2c||$8times16$PEs;html_special_mark_amp;multicolumn2c||$16times16$PEs;html_special_mark_amp;multicolumn2c|$16times32$PEshline$n$;html_special_mark_amp;actual;html_special_mark_amp;predicted;html_special_mark_amp;actual;html_special_mark_amp;predicted;html_special_mark_amp;actual;html_special_mark_amp;predicted;html_special_mark_amp;time(sec);html_special_mark_amp;time(sec);html_special_mark_amp;time(sec);html_special_mark_amp;time(sec);html_special_mark_amp;time(sec);html_special_mark_amp;time(sec)hlinehline1000;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;134.21;html_special_mark_amp;120.1;html_special_mark_amp;110.83;html_special_mark_amp;112.42000;html_special_mark_amp;502.57;html_special_mark_amp;444.3;html_special_mark_amp;448.69;html_special_mark_amp;362.3;html_special_mark_amp;336.34;html_special_mark_amp;310.83000;html_special_mark_amp;1037.03;html_special_mark_amp;994.7;html_special_mark_amp;792.18;html_special_mark_amp;756.8;html_special_mark_amp;576.68;html_special_mark_amp;610.44000;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;1436.13;html_special_mark_amp;1334.;html_special_mark_amp;1014.63;html_special_mark_amp;1026.8000;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;4268.35;html_special_mark_amp;4152.hlinetabularcenter{table}/; $cached_env_img{$key} =''; $key = q/{}$A^-1${}/; $cached_env_img{$key} =''; $key = q/{}$E_21${}/; $cached_env_img{$key} =''; $key = q/{}$calD${}/; $cached_env_img{$key} =''; $key = q/{}$Q^HAQ=left(arrayccA_11;html_special_mark_amp;A_12E_21;html_special_mark_amp;A_22arrayright)${}/; $cached_env_img{$key} =''; $key = q/{}$3times3${}/; $cached_env_img{$key} =''; $key = q/{}$J_+${}/; $cached_env_img{$key} =''; $key = q/{}$j=0,1,ldots${}/; $cached_env_img{$key} =''; $key = q/{table}centerlinetabular|l|l|l|l|l|hlineModel;html_special_mark_amp;;html_special_mark_amp;Performance;html_special_mark_amp;multicolumn2c|measuredvalues$mu$scline4-5Parameter;html_special_mark_amp;Description;html_special_mark_amp;limitedby;html_special_mark_amp;CM-5;html_special_mark_amp;Deltahline$tdgemm$;html_special_mark_amp;ttBLAS3;html_special_mark_amp;peakfloprate;html_special_mark_amp;190.;html_special_mark_amp;134.hline$tlatency$;html_special_mark_amp;messagelatency;html_special_mark_amp;comm.software;html_special_mark_amp;150;html_special_mark_amp;157hline$tband$;html_special_mark_amp;bandwidth$^-1$;html_special_mark_amp;comm.hardware;html_special_mark_amp;1.62;html_special_mark_amp;1.67hlinetabular{table}/; $cached_env_img{$key} =''; $key = q/{}$l=mboxtrace(P_+)=mboxrank(P_+)${}/; $cached_env_img{$key} =''; $key = q/{}$|A_j+1-A_j|_1leqtau|A_j|_1${}/; $cached_env_img{$key} =''; $key = q/{displaymath}bordermatrix;html_special_mark_amp;106;html_special_mark_amp;154;html_special_mark_amp;240cr106;html_special_mark_amp;A_11;html_special_mark_amp;A_12;html_special_mark_amp;A_13cr154;html_special_mark_amp;0;html_special_mark_amp;A_22;html_special_mark_amp;A_23cr240;html_special_mark_amp;0;html_special_mark_amp;0;html_special_mark_amp;A_33cr{displaymath}/; $cached_env_img{$key} =''; $key = q/{}$U${}/; $cached_env_img{$key} =''; $key = q/{}$4n^2${}/; $cached_env_img{$key} =''; $key = q/{}$(A_p+B_p)^-1B_p=QRPi${}/; $cached_env_img{$key} =''; $key = q/{}$Q${}/; $cached_env_img{$key} =''; $key = q/{}$mboxrmsign(A)${}/; $cached_env_img{$key} =''; $key = q/{}$1.44times10^-13${}/; $cached_env_img{$key} =''; $key = q/{}$j_max${}/; $cached_env_img{$key} =''; $key = q/{}$l=rmrank(R)${}/; $cached_env_img{$key} =''; $key = q/{table}labelintelsignprofilecentertabular|r|r|r|r|r|hline$n$;html_special_mark_amp;Sign-Func(%);html_special_mark_amp;QRP(%);html_special_mark_amp;$Q^TAQ$(%);html_special_mark_amp;totalhlinehline1000;html_special_mark_amp;123.06(91%);html_special_mark_amp;6.87(5%);html_special_mark_amp;4.27(5%);html_special_mark_amp;134.222000;html_special_mark_amp;413.95(92%);html_special_mark_amp;18.60(4%);html_special_mark_amp;16.13(4%);html_special_mark_amp;448.693000;html_special_mark_amp;717.04(90%);html_special_mark_amp;36.76(5%);html_special_mark_amp;38.37(5%);html_special_mark_amp;792.184000;html_special_mark_amp;1300.16(90%);html_special_mark_amp;63.13(5%);html_special_mark_amp;72.80(5%);html_special_mark_amp;1436.14hlinetabularcenter{table}/; $cached_env_img{$key} =''; $key = q/{figure}centerlinepsfigfigure=.cm5blocktime.eps,width=3inpsfigfigure=.cm5blockmflops.eps,width=3inlabelcmssl{figure}/; $cached_env_img{$key} =''; $key = q/{}$B_0=rI${}/; $cached_env_img{$key} =''; $key = q/{}$B_jA_j^-1=Q_12^-HQ_22^H${}/; $cached_env_img{$key} =''; $key = q/{}$l=mboxrank(R)${}/; $cached_env_img{$key} =''; $key = q/{}$A_33${}/; $cached_env_img{$key} =''; $key = q/{}$n=256${}/; $cached_env_img{$key} =''; $key = q/{}$|A^2_i-I|;html_special_mark_lt;1${}/; $cached_env_img{$key} =''; $key = q/{}$A${}/; $cached_env_img{$key} =''; $key = q/{}$|A_i+1-A_i|_1leqsqrtn${}/; $cached_env_img{$key} =''; $key = q/{}$B_0=B${}/; $cached_env_img{$key} =''; $key = q/{}$lat${}/; $cached_env_img{$key} =''; $key = q/{}$A_0=A${}/; $cached_env_img{$key} =''; $key = q/{}$A_0${}/; $cached_env_img{$key} =''; $key = q/{}$Q^H_1(A_p+B_p)${}/; $cached_env_img{$key} =''; $key = q/{table}centertabular|c|c|c|c|c|c|c|c|hline;html_special_mark_amp;;html_special_mark_amp;Actual;html_special_mark_amp;Predicted;html_special_mark_amp;;html_special_mark_amp;;html_special_mark_amp;GEMM-;html_special_mark_amp;Inverse-$n$;html_special_mark_amp;$|E_21|_1|A|_1$;html_special_mark_amp;Time;html_special_mark_amp;Time;html_special_mark_amp;Mflops;html_special_mark_amp;Mflops;html_special_mark_amp;Mflops;html_special_mark_amp;Mflops;html_special_mark_amp;(iter1,iter2);html_special_mark_amp;(seconds);html_special_mark_amp;(seconds);html_special_mark_amp;(total);html_special_mark_amp;(pernode);html_special_mark_amp;(pernode);html_special_mark_amp;(pernode)hlinehline256;html_special_mark_amp;$4e-14$(16,2);html_special_mark_amp;25.4;html_special_mark_amp;18.9;html_special_mark_amp;0.72;html_special_mark_amp;0.96;html_special_mark_amp;12.57;html_special_mark_amp;0.69512;html_special_mark_amp;$2e-13$(16,2);html_special_mark_amp;58.6;html_special_mark_amp;50.8;html_special_mark_amp;106.88;html_special_mark_amp;3.34;html_special_mark_amp;22.14;html_special_mark_amp;2.62768;html_special_mark_amp;$2e-13$(15,2);html_special_mark_amp;99.23;html_special_mark_amp;97.1;html_special_mark_amp;203.84;html_special_mark_amp;6.37;html_special_mark_amp;30.32;html_special_mark_amp;5.051024;html_special_mark_amp;$2e-13$(14,2);html_special_mark_amp;143.92;html_special_mark_amp;159.5;html_special_mark_amp;318.40;html_special_mark_amp;9.95;html_special_mark_amp;37.71;html_special_mark_amp;7.811280;html_special_mark_amp;$3e-13$(15,2);html_special_mark_amp;231.12;html_special_mark_amp;239.6;html_special_mark_amp;405.44;html_special_mark_amp;12.67;html_special_mark_amp;42.06;html_special_mark_amp;10.641536;html_special_mark_amp;$2e-12$(14,2);html_special_mark_amp;296.99;html_special_mark_amp;338.8;html_special_mark_amp;520.64;html_special_mark_amp;16.27;html_special_mark_amp;46.61;html_special_mark_amp;13.491792;html_special_mark_amp;$7e-13$(16,1);html_special_mark_amp;423.42;html_special_mark_amp;458.9;html_special_mark_amp;579.84;html_special_mark_amp;18.12;html_special_mark_amp;51.47;html_special_mark_amp;16.162048;html_special_mark_amp;$7e-13$(14,2);html_special_mark_amp;506.11;html_special_mark_amp;601.3;html_special_mark_amp;732.16;html_special_mark_amp;22.88;html_special_mark_amp;55.72;html_special_mark_amp;18.87hlinetabularcenterlabelsigncm5{table}/; $cached_env_img{$key} =''; $key = q/{}$j;html_special_mark_gt;j_max${}/; $cached_env_img{$key} =''; $key = q/{}$ULP${}/; $cached_env_img{$key} =''; $key = q/{displaymath}A_j+1^-1B_j+1=A_j^-1Q_12^-HQ_22^HB_j=(A_j^-1B_j)^2{displaymath}/; $cached_env_img{$key} =''; $key = q/{}$delimiter;html_special_mark_quot;26B30DE_21delimiter;html_special_mark_quot;26B30D_1delimiter;html_special_mark_quot;26B30DAdelimiter;html_special_mark_quot;26B30D_1leq10^-11${}/; $cached_env_img{$key} =''; $key = q/{}$|A^-1|_infty${}/; $cached_env_img{$key} =''; $key = q/{}$pm${}/; $cached_env_img{$key} =''; $key = q/{displaymath}left(arrayccQ_11^H;html_special_mark_amp;Q_21^HQ_12^H;html_special_mark_amp;Q_22^Harrayright)left(arraycB_j-A_jarrayright)=left(arraycQ_11^HB_j-Q_21^HA_jQ_12^HB_j-Q_22^HA_jarrayright)=left(arraycR_j0arrayright){displaymath}/; $cached_env_img{$key} =''; $key = q/{table}centerlinetabular|ll|c|c|c|c|hline;html_special_mark_amp;;html_special_mark_amp;20matrix;html_special_mark_amp;QR;html_special_mark_amp;2Householder;html_special_mark_amp;Total;html_special_mark_amp;;html_special_mark_amp;inversions;html_special_mark_amp;;html_special_mark_amp;applications;html_special_mark_amp;hlineComputationcost;html_special_mark_amp;$timesfracn^3ptdgemm$;html_special_mark_amp;$scriptstyle40$;html_special_mark_amp;$frac43$;html_special_mark_amp;$scriptstyle4$;html_special_mark_amp;$scriptstyle45$hlineLatencycost;html_special_mark_amp;$timesscriptstylentlatency$;html_special_mark_amp;$scriptstyle160+20lgp$;html_special_mark_amp;$scriptstyle3lgp$;html_special_mark_amp;;html_special_mark_amp;$scriptstyle160+23lgp$hlineBandwidthcost;html_special_mark_amp;$timesfracn^2sqrtptband$;html_special_mark_amp;$scriptstyle90+35lgp$;html_special_mark_amp;$frac34scriptstylelgp$;html_special_mark_amp;$scriptstyle4$;html_special_mark_amp;$scriptstyle90+40lgp$hlineparbox1.20inImbalancedcomputationcost;html_special_mark_amp;$timesfracbn^2sqrtptdgemm$;html_special_mark_amp;$scriptstyle60$;html_special_mark_amp;;html_special_mark_amp;;html_special_mark_amp;$scriptstyle60$hlineparbox1.20inImbalancedbandwidthcost;html_special_mark_amp;$timesscriptstylebntband$;html_special_mark_amp;$scriptstyle20+35lgp$;html_special_mark_amp;;html_special_mark_amp;;html_special_mark_amp;$scriptstyle20+35lgp$hlinetabular{table}/; $cached_env_img{$key} =''; $key = q/{}$r${}/; $cached_env_img{$key} =''; $key = q/{}$O(scriptstyle(n^2p)tau_band)${}/; $cached_env_img{$key} =''; $key = q/{}$sqrtp${}/; $cached_env_img{$key} =''; $key = q/{}$p${}/; $cached_env_img{$key} =''; $key = q/{}$tau=nULP${}/; $cached_env_img{$key} =''; $key = q/{}$(A+A^-1)2${}/; $cached_env_img{$key} =''; $key = q/{table}labelintelsigndatacentertabular|c|c|c|c|c|c|c|hline$n$;html_special_mark_amp;$|E_21|_1|A|_1$;html_special_mark_amp;Timing;html_special_mark_amp;Mflops;html_special_mark_amp;Mflops;html_special_mark_amp;GEMM-Mflops;html_special_mark_amp;INV-Mflops;html_special_mark_amp;(iter);html_special_mark_amp;(seconds);html_special_mark_amp;(total);html_special_mark_amp;(pernode);html_special_mark_amp;(pernode);html_special_mark_amp;(pernode)hlinehline1000;html_special_mark_amp;$7.0e-13$(18);html_special_mark_amp;134.22;html_special_mark_amp;293.05;html_special_mark_amp;1.14;html_special_mark_amp;9.04;html_special_mark_amp;1.412000;html_special_mark_amp;$1.6e-12$(21);html_special_mark_amp;448.69;html_special_mark_amp;808.28;html_special_mark_amp;3.16;html_special_mark_amp;15.51;html_special_mark_amp;3.883000;html_special_mark_amp;$3.1e-12$(18);html_special_mark_amp;792.18;html_special_mark_amp;1340.60;html_special_mark_amp;5.23;html_special_mark_amp;19.95;html_special_mark_amp;6.434000;html_special_mark_amp;$5.9e-12$(19);html_special_mark_amp;1436.14;html_special_mark_amp;1841.98;html_special_mark_amp;7.19;html_special_mark_amp;23.12;html_special_mark_amp;8.70hlinetabularcenter{table}/; $cached_env_img{$key} =''; $key = q/{displaymath}|A^2_i-I|_1=|A_i(A_i-A^-1_i)|_1=2|A_i(A_i+1-A_i)|_1leq2sqrtn|A_i|_1,{displaymath}/; $cached_env_img{$key} =''; $key = q/{}$U^-1L^-1${}/; $cached_env_img{$key} =''; $key = q/{}$n${}/; $cached_env_img{$key} =''; $key = q/{}$I-P_+${}/; $cached_env_img{$key} =''; $key = q/{}$l${}/; $cached_env_img{$key} =''; $key = q/{}$frac12(A_p+I)=QRPi${}/; $cached_env_img{$key} =''; $key = q/{}$Az=lambdaz${}/; $cached_env_img{$key} =''; $key = q/{}$J_-${}/; $cached_env_img{$key} =''; $key = q/{}$AX=I${}/; $cached_env_img{$key} =''; $key = q/{}$d${}/; $cached_env_img{$key} =''; $key = q/{}$j_max=60${}/; $cached_env_img{$key} =''; $key = q/{}$b${}/; $cached_env_img{$key} =''; $key = q/{}$(A_p+B_p)^-1A_p=Q^H(R^-1_2R_1)Pi${}/; $cached_env_img{$key} =''; $key = q/{}$(n-l)times(n-l)${}/; $cached_env_img{$key} =''; $key = q/{table}centertabular|c|c|c|c|c|c|c|hline$n$;html_special_mark_amp;$|E_21|_1|A|_1$;html_special_mark_amp;Timing;html_special_mark_amp;Mflops;html_special_mark_amp;Mflops;html_special_mark_amp;GEMM-Mflops;html_special_mark_amp;INV-Mflops;html_special_mark_amp;(iter);html_special_mark_amp;(seconds);html_special_mark_amp;(total);html_special_mark_amp;(pernode);html_special_mark_amp;(pernode);html_special_mark_amp;(pernode)hlinehline256;html_special_mark_amp;$4e-14$(18);html_special_mark_amp;33.3;html_special_mark_amp;21.76;html_special_mark_amp;0.68;html_special_mark_amp;12.57;html_special_mark_amp;0.69512;html_special_mark_amp;$2e-13$(18);html_special_mark_amp;67.7;html_special_mark_amp;84.48;html_special_mark_amp;2.64;html_special_mark_amp;22.14;html_special_mark_amp;2.62768;html_special_mark_amp;$3e-13$(17);html_special_mark_amp;115.1;html_special_mark_amp;160.00;html_special_mark_amp;5.00;html_special_mark_amp;30.32;html_special_mark_amp;5.051024;html_special_mark_amp;$3e-13$(16);html_special_mark_amp;165.0;html_special_mark_amp;251.52;html_special_mark_amp;7.86;html_special_mark_amp;37.71;html_special_mark_amp;7.811280;html_special_mark_amp;$4e-13$(18);html_special_mark_amp;259.1;html_special_mark_amp;329.28;html_special_mark_amp;10.29;html_special_mark_amp;42.06;html_special_mark_amp;10.641536;html_special_mark_amp;$2e-12$(16);html_special_mark_amp;331.4;html_special_mark_amp;422.72;html_special_mark_amp;13.21;html_special_mark_amp;46.61;html_special_mark_amp;13.491792;html_special_mark_amp;$9e-13$(17);html_special_mark_amp;456.9;html_special_mark_amp;512.32;html_special_mark_amp;16.01;html_special_mark_amp;51.47;html_special_mark_amp;16.162048;html_special_mark_amp;$1e-12$(16);html_special_mark_amp;552.0;html_special_mark_amp;601.60;html_special_mark_amp;18.80;html_special_mark_amp;55.72;html_special_mark_amp;18.87hlinetabularvspace.2intabular|r|r|r||r|r||r|r|hlinebfCM-5;html_special_mark_amp;multicolumn2c||GEMM;html_special_mark_amp;multicolumn2c||Inversion;html_special_mark_amp;multicolumn2c|QRPhline$n$;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;time;html_special_mark_amp;Mflops;html_special_mark_amp;(seconds);html_special_mark_amp;(pernode);html_special_mark_amp;(seconds);html_special_mark_amp;(pernode);html_special_mark_amp;(seconds);html_special_mark_amp;(pernode)hlinehline256;html_special_mark_amp;0.08;html_special_mark_amp;12.57;html_special_mark_amp;1.51;html_special_mark_amp;0.69;html_special_mark_amp;2.23;html_special_mark_amp;0.63512;html_special_mark_amp;0.38;html_special_mark_amp;22.14;html_special_mark_amp;3.21;html_special_mark_amp;2.62;html_special_mark_amp;5.01;html_special_mark_amp;2.23768;html_special_mark_amp;0.93;html_special_mark_amp;30.32;html_special_mark_amp;5.60;html_special_mark_amp;5.05;html_special_mark_amp;8.96;html_special_mark_amp;4.211024;html_special_mark_amp;1.78;html_special_mark_amp;37.71;html_special_mark_amp;8.59;html_special_mark_amp;7.81;html_special_mark_amp;13.29;html_special_mark_amp;6.731280;html_special_mark_amp;3.12;html_special_mark_amp;42.06;html_special_mark_amp;12.32;html_special_mark_amp;10.64;html_special_mark_amp;20.41;html_special_mark_amp;8.561536;html_special_mark_amp;4.86;html_special_mark_amp;46.61;html_special_mark_amp;16.80;html_special_mark_amp;13.49;html_special_mark_amp;27.32;html_special_mark_amp;11.051792;html_special_mark_amp;6.99;html_special_mark_amp;51.47;html_special_mark_amp;22.26;html_special_mark_amp;16.16;html_special_mark_amp;35.65;html_special_mark_amp;13.452048;html_special_mark_amp;9.64;html_special_mark_amp;55.72;html_special_mark_amp;28.45;html_special_mark_amp;18.87;html_special_mark_amp;45.21;html_special_mark_amp;15.832304;html_special_mark_amp;15.64;html_special_mark_amp;48.89;html_special_mark_amp;35.86;html_special_mark_amp;21.32;html_special_mark_amp;62.51;html_special_mark_amp;16.302560;html_special_mark_amp;20.12;html_special_mark_amp;52.12;html_special_mark_amp;44.17;html_special_mark_amp;23.74;html_special_mark_amp;77.45;html_special_mark_amp;18.052816;html_special_mark_amp;25.28;html_special_mark_amp;55.22;html_special_mark_amp;54.03;html_special_mark_amp;25.83;html_special_mark_amp;94.06;html_special_mark_amp;19.783072;html_special_mark_amp;31.82;html_special_mark_amp;56.94;html_special_mark_amp;64.77;html_special_mark_amp;27.98;html_special_mark_amp;113.20;html_special_mark_amp;21.343328;html_special_mark_amp;39.16;html_special_mark_amp;58.83;html_special_mark_amp;76.76;html_special_mark_amp;30.01;html_special_mark_amp;134.75;html_special_mark_amp;22.793584;html_special_mark_amp;47.30;html_special_mark_amp;60.83;html_special_mark_amp;90.97;html_special_mark_amp;31.63;html_special_mark_amp;159.38;html_special_mark_amp;24.073840;html_special_mark_amp;56.91;html_special_mark_amp;62.19;html_special_mark_amp;106.30;html_special_mark_amp;33.29;html_special_mark_amp;187.37;html_special_mark_amp;25.184096;html_special_mark_amp;66.32;html_special_mark_amp;64.76;html_special_mark_amp;123.23;html_special_mark_amp;34.85;html_special_mark_amp;218.05;html_special_mark_amp;26.264352;html_special_mark_amp;78.60;html_special_mark_amp;65.55;html_special_mark_amp;142.09;html_special_mark_amp;36.26;html_special_mark_amp;273.52;html_special_mark_amp;25.114608;html_special_mark_amp;91.35;html_special_mark_amp;66.94;html_special_mark_amp;161.77;html_special_mark_amp;37.80;html_special_mark_amp;313.53;html_special_mark_amp;26.004864;html_special_mark_amp;105.56;html_special_mark_amp;68.13;html_special_mark_amp;192.56;html_special_mark_amp;37.35;html_special_mark_amp;377.39;html_special_mark_amp;5120;html_special_mark_amp;120.80;html_special_mark_amp;69.44;html_special_mark_amp;216.21;html_special_mark_amp;38.80;html_special_mark_amp;407.42;html_special_mark_amp;27.475376;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;38.80;html_special_mark_amp;493.26;html_special_mark_amp;26.255632;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;38.80;html_special_mark_amp;554.36;html_special_mark_amp;26.855888;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;38.80;html_special_mark_amp;628.69;html_special_mark_amp;27.066144;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;--;html_special_mark_amp;38.80;html_special_mark_amp;699.88;html_special_mark_amp;27.62hlinetabularcenter{table}/; $cached_env_img{$key} =''; $key = q/{}$barcalD${}/; $cached_env_img{$key} =''; $key = q/{}$(A+(r-mu)I)^-1(-A+(r+mu)I)${}/; $cached_env_img{$key} =''; 1;