ࡱ> `!2 :"W֦qY3-|6=5]`Z xݛolGgnogwo[*VkqRǎKF DAiRuDD/n)rDJ|B@SOTV#@*! hCٷsoߌ}>N*3潙y;;VAHjjBL0I)h^j@ U{GZ!gp~b$WkyUP7hG}cRHg!"+X\~{uJ}{_&EU=zb}G݇ *ox;d퉯oEhM8[ZR>UHo۪3J X'_M^z_J#]yr5!KJqjHd@/3mҳ>8d_ғ i>}݅R-jgK]|4vWެ^nl7EfL% % ٱ4cidS6PP'2ż+Y2rӹJ{e ܐͺhF$Qdt ]#uqVa z&Z3Fݴ} !!;.p_C9U྆R྆<),9n@7G#ts9n@.5-!^8+)d,}@liXArrvu:264g)26 g2vMd,Brqv/d]l}} -Ύ;XCr^5hFrmv9n' آ |m\[ ~\W#,e%KXS\guk jgUWA)jd|>9ޝEy±L9ȼdU d28#O9 Cx; 34*B ']_ =fٙh]*lZ{8‚x Ew4n?2a~^Oѧ)uWamT0&dRٙ糛2Pb* 糍 ƧLi=ա7~mT0WȤWJܝ}OX -TM.ǂg&$̡2v%Jcu{fc\&1{sPl~@ `mIu5?iCI1Rw"+MIu>~^\hguvk!gH~"\oR_1^oWQ1r J$ Fd}oM{~=!_ftoH4H& B?w#Q=U؛ nosGZG ֻFhm8Z{T Zd@B*ض{zw;ۼ++n)ދoΠ͒;h Z9s:SɮsY2j56B̺j܅tݳvP>?2˳Qhoo'3Y$ɐD{TL^v_,zAn_ 陷RگMvN~ڧ{k[n{2@"YK ' ύZ 蠞qJ̺A~cCYzBfX=]Q`HE}Ǹ}'Y\IPTE^ [e##-WW|E6wrGxחJgU:Og+5L^/{ɺǶVZuNµzZz|Fb1p5c~FI(Qc6J/Xxg.{G/y3;rkDoSk'jo~>]M?N--?[Օ{\FTn/*bǤi(PNG  IHDRmQt*gAMAPLTEٟ IDATx}y盝Yb W\Xh Ū:_}RIv-RRr K e_$WR"bH++&[Y-(fY6%1 {4LN鞝m/3ݿ{fx;3)Xi'0X\I/B/e xvۧܲ;u?2"|RX^X{*|"x J". |cvQL6Rf0˯Ɍ`3vͧy 6}Q@0Qy|3d^Uγ}u)zoc>}}|-jiE*_F<= _sCЧ<}dY%ٔ*M ?5L=}J>Ԫ{®&XGMߦGivw<<"jwnY`WV^,Ѣr((1s)Sݦ`|/#y%4Np !xݔ izld&VGdm]-DݯKJk~u"p4)| (^Oze-/]r/apXp϶stcyg[~G&("iz*B*FKszf[9ƻ0X!&M ,ƮwrHjlMշj?>Hf@Uh QW$*ywr`hٷ(~-iUQh]"ԉ1IՓ/3 mIArD]7 eiiQQsj}lxbY5@O7 g+8&]$iG[s1z9ń@wj>n1n妧Q]]`㚯WP/]O'^»5PkXu& ߹b[fm2iif0ņ_ U5F[M4O¥|O}nWQi^EO)DDzp՝66hK~(r1_߼^å~11hZ'`&,)6bKH'%em9ddZ<9ѓgtsa51/6N_h(| B)> W<$:$"ߏ?} pGM ÎLȬY yW$}ڴ;9Ciܐ7TX\E5g=]j\ނg\Iϐ ,8 U䄨OӇo`*PouCN\'ro<9* QJݛ 9Z78YvЄ R7oOf2-FMu7E0grQWu.L: W/OJ84o,a*iٓ``:KҊ>竾Xzva##&SpޏQc(aťoyT6Ew"ai v?|zF)yLZ7d|2e.Q_3bj`I3-]7|7K)l,o &Zv=CiBkԉ`\CĿ0iDR(uX짿0,`WO[8e'C+XL/S#0"%)|ld)27m&/!aHybx_[f>3w3NN8$"닱z>gCs ѳ\/j-2twI:8l(ϔ;$LڒZr 8l//8`J -.XjL9UW0~kp')߼#s{p\\&raq/dHqĻ5fuJ _G^LWP@0IGPShw<-Jҡ|;G{DO[}YY8}!k6F 352\Tg!K{B"m'['Qv#œ+. aރ3DSB#Gu!|_Ӣlhy` U1be|Ž ݁G܋yd.Zu53_[~DFvq}S3U R+[zo M&2/:׽b 1@tO'J?'N:VyQrWBwafųK +Mxz.ȰG,R*wxjv8:BIWhkcU췆h Io]Yp W[=T0`Q7"oSK|d> )T$ml:x+=ek<OO FR&V,]oȲ~ 51NRIQOHY3l<)0u:&-t0);;>c2\̍?K/xc~{Sl(v|^/ m4ol QRӞfC=4"_xv5ɹ*X1:z_\s8< &) nazwOoj^؞A7d~g|iefz|3V:{/ <9>Cگ;J7IER4@=Zцi~p*m%ܽK?L>=LNHy%=LTZf w><߱::Zi3 V4LGo ]}T1c 5%wl.QSA h]ߺ]%z]t1Cl0;vӶ# /tN"$KMFY;@Qqp*\d5 , 7Uѻ tiguslv0 SvVH8=NyeS(TBI}pY*E-DҪ bw2֯?->I K|׀^7> a-A*zގ+>. ̫<"duSψUiEC?B_ަj|_Q_澻Jw9̙h5rT/#{ W؝?C.VJ},U."TQpuJ;d/$Y u2R߹Ns`j~OTr6sx;zCAZQ%cGCFzQ0'3B :,6Z#K R S`9˄.y M\.SbH8H*["l6BF8-M p{Np # 2cY.:8EGl%;W%ljL"m a 05#u̅YQ?6qxZI ~tW6/[2M[}9rq'QqeӤ"|֤b<HJ'rLv 70]TH_U)=e$KCfhzz&PT#d$o[ga9Y>Hpx11e:I?b/iX]nFpHح'>O挕#N+~e@!OP8OYC (*ojreC,+Ԋ{FƔ.6wKq9*ڬxΏqL# KijEӇo͚+H"~A2'M&&.{Q!&vTW ROI d;ً/i|h+eZ ȩUcx )jM#=l=Xzqׁjò)dxif?fn7Z_VMi٣FgpPwRm,F?KP{Ie76jJ?-H)y-p9٫<ijI_K95mzZ!3 6,U}h!\ Ŋj4E}JQ4ШI:n/1);]=Wnl9D oSӴZjz.YQ0!'iks*Pn){H:ÓA[I=KMiW-¨$a ?V?N6uo '_ގqN"oID̛'왧#oQpi8,8cၢjmΎ) x&EĆ0\%ƔEpNҦud+W W"*ۿDŢi5 x/ S=GK Lv0`FU%|))"!aP L M4m'eAh!852/{'P#[&X~b@ݳk8J^K`xHnݐ7h c`]f{'Cp988nɷHkر$iPZC){l:̼8d:oX$:JSFwYG 0zT8"w&<A$q*Bx'Hލ|2IZ¢$ՕZBe#BHvܠjD8)jM:A2ZirL$ɀur:w6~.jl YDE>FGy@~ KXXۀ`gCrʘZŒe#+KǤTlo=0+6׆ޥ`CyN4F(4NW,vϙdfSC3(۲!hHxz-=69졿 ط8Mxis(WlJ0}2ܷЀW9{:ԜO o [l#!QጞaeW8Wl:g=;2Pp8bfeV >~A, 08+!?$RﳤibHnݽAoI:1$`<_ Qɬ]w,ՄucFD9_7vKIyl&L5ᇑŠqAILg̼D;z٣-ؙo\G7Ͷ<EոXG7)qCaAіH"q/d)lT"4y/*Bml(։[*XC&vƸeeM Q6Tl>ja +g)6Մ ̮/9f ؁\54ҞG N 6˕[F/l÷II?ls&uz覟m?Tjl#HlFtZQM-9l-@&MI Τ,'!/~Q`_mA{WS[PWr 3 T" )`7%SY0j6f(`!hD-e<~~T n91FM%wyO umk]xI!E{h6k"+^a[?VI^vy9'T 3$7(=mIўYpD^gcM,>ޒwCnML H8krxܕa{0z%PI3al,6y%NP_ MO0<?cCl &R:Y}Ea[aW'[~}EΚ1bOLWV4=V66R쫓38QޭkRNϱ]K5(.$sQMڽb{bCr״3{,؆ +,rz&0<0 *Ne!B|Mw=& Ņ&nk; ϾmBuWYl3R 7=Y;Yr_h\(M{NsRwvQ~=Vpz;۩e]S?RIdjѱ5Je{lÎEsZTԷ!(pUDwn:i .D:ۘa!ng?2K4W Fo6B=؂e=<Ć6QK@܂n>0CHQYN^;pe0 g Tx; AX42K ړ-ݧM⿶ZSfjc JܰڨdF飜^]38Lp6K9烷Oiκ|u`ܛMan84!֮K#x @oi^N=x!'0ʣ8-af8B/( (A =5S~1j]6U9e NLsk-6x[4Djy@#8]@n`YNz|OZ$5֨aB"2*E 7ZIىԫP!i5n|FpS=`CQJ&ӡCG ;~#{T>Ӹ97qiѺo~M3Zh'K %X걼(טt X+&=xͰT@LFZh>%CAv: 2Ӗj;u:>b ZQE0*GN^ND̨7ZÐČh]kb#T':`'DB/:0szcJqK> AviDn)*]#<;LhdAk:J/QAe6"ԁ87.1 u> -!?<1(yLÃbw=p8kvvUJI JùixBU* X׮ ξcׂ[:m37ƚ>p;'y5oT̪][|A<ߝ/i.LwuT#w&c#?.PZ_}bcSWոs߀B:ԽNQczh]B 5J]ޘ2a;&w=8yIU1޺kGa&val&~F})3 LIajSlzu^m\׫w|<.Q0# ƒ 8|{у&V ?|z+=*ޝzK3bţ ]Hqo(cR J>S5]7ۭzT3 W:`{@.F39.m$"b"oW䛲'z h>҉_o h[w&<‡U: npfm> r17] f3ah ]o ߑ*Icw؎C̔0Z@o";Gxz9+PJQĕw:ޤ^j~l /*xyO`eJϋR#$q(:Z^D~KW8MᅵEy+'xq]]ᶺEOA=CQK_So(y" /\3d`w8$Ťü; \9ִQw_)q5?(/zk^%L:gw T~՞81֝zE2s&΋Xm5c_aZ M3;M3ȒCk];:AJ ptdċ5_^ 7w~#ڢ*yDJY+RaA~p޹Np>A/xDؕvt /UN |~nOԆm֤ ߋ3LFd}f^*/uE;VV럖e?X%4A":lem ZO\V@.u˷Z|#r@22stoܯh[d=QfJ>p ̓#ȃ$LDD2Ko-'6R0u*b"nȀ>;|"&f|N͏"sѵ"VHGi5ԉ]/vi$<uP| :~Y}%ŬDɱTgu@G lCm~(~5੏ڧ{"KЫcKpZ8AKA0u .7Ǵ sc5 \~X/G f5}l/+yEx8~V(ui*:NuT:Yۑ5 foDD"/pI:luQՖ_>sר!W_Ka]8J4mؼ/LQ8֯2 @b<ǝNޣ {_F{%#{5,׆5vG_A^z;͎68mcu't~Vzƿ_;6x>|#G[#Z/yJ~}kVt2NmteeQ^|#?x#Yw PرBu18f^/kl/#;mpM`p;SXL%KסW]¤+^ޕ٤8F[T3u縘"OVbvs[ w/u:;k.вx {pKtY ?*c4X wfcd 6\:;U aE$3/a.zSn:~gWw:V_O2yzIENDB`zawq1v&( wwwwn|DA`nw|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(P cFumow?cɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ% /)J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%D?Iɭo߉G%hmd7/ =? o/U[|߽=MN'"n zC|! ?wo_TzC7|aI"4_lԛ97XCoo\ooEIџ7ɗ]f~MUkS4||ԥ: !_v˱C);ooH :uB)Jo M œM M.N i+_9n-Y||ԫ:n-_;,\ ~|C/#ӽ_/ߟ̴LN?nk[7Η9n/8_f|7Ho}75BV0|q,8_仑 ޺y||ٓ T˞uw0|Gظ| 3ɷ|<$~k? 3)&q仙'3f'߬aC [.w0oa~'a_#|`0O>0|hWNjwu_70u ?|h| 7/ͽ-k+ҿϒo_ǔ7y %_0=aN6˽',:s&|%/&|ćFna׿t9[}o!_0 Ks^!_0huy|˜b['_0xo! į>[8M _0 n+FBM•y|ˆOx|aCLUMZzLMs5_$$_3r#LE7 Ozrf/~Iou^._PL}D7 .$u µMEo s5_||F>4|.LUm #zV0|u|zȇ/poo#_o0a n#m #F>4|/zK|aCȇ #zSşX;||mt~M񝶫VʗrZ+eG;wؤo4'(_G!M^Q@o`r|3 E#7׆|`/jk)A^/X}ؗ|v=>ʗ狎CDڔ/9˗Ћ߶/˗^k&^,_2m0/E/~2W ˗|鋑|ዟ|9^|K_t+_oX2|~﹭2|Y`[G!0_ރ||ڰf]j|G"0߈^+ _ݪcnp΍9po~zw! _2.sdm2Yܨ^Zy $DS M KPS8 ڌ "-jkhs&-\D`PC[N "_fmh&3Rie{Rie"_79oorwF/X3k>f}`M%|3}y| ߌi%|3}牟|-7c|G/X3VCtm𽧃wh|-Dd|M2|ftn!_7k|7'ߢ|N:N}&˷/} -Ho&;,'ȷ/ѫ{>7Y "_uhy/o7pdV R |3s #|_|`x{xxtP"_8M3Z]rv/fU;?\mB7P8o=;q|_@]-/~xY/Ny`7#+|1_tb;2||VN/<:ăm;5/(`/ We ~竣/uj&*8|狇 &~|$J xNw||}]&ұ|cC%f⫒5ECoI#ߕ|jFd,N oVɷ$_0G0V%_zN'ߒ|“O[R߇|c|o%_<wdp;Uu Kns _.I|ݍoh~ ځ/7!_v`4_|#@ɷ&_pl/H[Til72||o'ͷ|6yT[!w;0{{{vWfgn;:P|jpfm򞝯IU{0wkɌq}qm(G˝x<;_uX0bǎg;.ok|Ǜ-Ʒy[1wvaw||`9n72\ݳ~Z{˳wo_) Ow(Yj|6 }n9qˮ{fnۅ&~Owؿ>{~hߌ=񵟻|-4o~~R|?~/4o~~#{dގ|C0~ s?1_S: w,f1oOo+wkǽ0e5G_[5_wvjǽ0%+-so~[+|_G]=}UѾo[=/U݁oyJ>F>4b|_O<|ݎgǽ0O$|~gzV>G[[]wx>|Lw_=!|_o||?̷;_-w3_|#;h~s;Ug}eOi仝v[c||ՑڽyU[k|7y]ّ}w _?/nNtC?#_{/׽dX|owuhw[=O xG_y {| FeP?e[Mu&ҧ6w [~n鳶;~nӎ>^oӎvKϛo-=ot߽~}}oݷ߉텿xx_{7ӷ׻EzNvnf|z+&ټ-z Quq^|_;~܉_RӾgމKxocGp[oy ,ߒ|m=Yo.wU<-8 E"z| >{Cm=ņZ3=-_YO̗/|7GX'=GWg6~#ǒ%J>TW?zozɇUF>RW=zozɇ% Ϸ{|2O?zozɇ*y\*G>RW?zw.ɇU_ѻsI>T|On}|;P,MomK>T|Co7V67|9Uٽ -wO˫t"|(}GBWѦW߭B_v?^3/Ɗ/Y?-PEhī[F xZoFW'kW)|W|د䋧&!_ny>BT&_BuWi[}KOQ҅ ֦RMm#ܩr^n^wּ7Rr&5ͽZyNߪ;U_:Amf+Pmg~;VާU4ﴣ^u 7oWݧ͛U yuw$ j|+_$vߪ[V>Ҝy(^ߜys.7g\K%͙77RI|s+QQ|I X_;ɷSN}-'~k_H(_7=sWޣg.;Tfo*[em'֞75sYdeM\w,K75siޟ6|Oa|_0C-oES^}wJی;mG?7v}EK;-o쬷ZwJ;6Mq|m{S_ر[ͻǎ9;Mq|;S_srǎG9 ˽g#G|s})/})o!/}% =䥯D!R"cvDǼ7"2_&z9ʗ>{-/ڑ2gG=w 勏ͣP]5ޏ5)Q(/8x|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(PCɇ%J>|(P_I;ChIENDB`zXYJ-X kA(t  X##XOO66)OO7XX##F##UXXcOO66rOOX##X3(  @ vhttp://developer.intel.com/design/itanium/documentation.htmvhttp://developer.intel.com/design/itanium/documentation.htm"f/design/itanium/manuals/iiasdmanual.htm#applicationhttp://developer.intel.com/design/itanium/manuals/iiasdmanual.htm0application\/design/itanium/manuals/iiasdmanual.htm#systemhttp://developer.intel.com/design/itanium/manuals/iiasdmanual.htm0 systemF/design/itanium2/manuals/251110.htmzhttp://developer.intel.com/design/itanium2/manuals/251110.htmD/ 0|DArialtury BookTTwܖ 0ܖ"DArial BlackookTTwܖ 0ܖ" DWingdingskookTTwܖ 0ܖ0DTimes New RomanTTwܖ 0ܖ@DITCCentury BookTTwܖ 0ܖ@ .  @n?" dd@  @@`` H3233+  9;<=>?3   ,, abc&efghij lm2$:"W֦qY3-: b$*bǤi(/: r$wq1v&iW9$$$$$$$b$|DA`nw%;ʚ;ʚ;g4dd 0Rppp@ <4dddd k 0Tv<4BdBd k 0Tv 0___PPT10 ___PPT9vhttp://developer.intel.com/design/itanium/documentation.htm?  %u"6Confessions of a Performance Monitor Hardware DesigneriWorkshop on Hardware Performance Monitor Design HPCA-11 13 February 2005 Jim Callister Intel Corporation jPI!,Why Include a PMU?Ya gotta do something with all those transistors! Cause my PAPI told me to To give competitors a fighting chance To show my boss how great my branch predictor is (ie., get a raise) To improve the performance of current and future systems4  9$6I/=How much Performance would you give up for PMU Functionality?*> Transistors may be  free but& Wires are not! Design time costs Validation costs Documentation costs Time to Market costs The answer is not 0% PMU proven to improve performance But it s not 10% either!tZ[ZZ"ZZ["70What to Architect in the PMU? Machine Architecture is a contract between hardware and software Architect too much& Lowers performance through design constraints Events don t map well to hardware Architect too little& Jeopardizes Software Investment Discourages Software SupportTWZPZZ=ZWP=1Itanium Architecture: PMU& Architected Access & Management of PMU Resources PMD registers for Data, PMC registers to control PMU Counter Overflow Behavior and Interrupt Handling Only a few basic counter events Implementation Dependent Number of counters, width of counters Non-counter performance monitors Events: Encourage use of CPU-specific tables Itanium architecture protects OS and Tool infrastructure while promoting performance and full visibility Z%Z5ZQZZtZiZ %5Qt  i2VPerformance Events  Let me count the ways& ,,bWhich events are important? How will the events be used? Do you really care about a cache miss if it doesn t cause any stalls? Mapping an event to signals Needed signal may not be available On critical path, lack of wires, no signal Combining signals is problematic Distance between signals, timing, logicc#+!(c#+! (@ Itanium 2 Processor PMU Events*  4#Where are the Performance Problems?$Counters only give type of problem and magnitude of the problem Use filters on counters (hunt & peck) Itanium architecture currently includes: Opcode Filters Privilege Level Filters Instruction Address Range Filters Data Address Range Filters>ZdZm "d^A!+A Better Way to Locate Performance Problems,,Event Address Registers (EARs) Logs information about a single cache miss The logs are sampled by software Creates a statistical profile of cache misses Branch Trace Buffer (BTB) Logs information about consecutive branches Logs also sampled by softwareTZzZZJZzJB"Lend Me an EARInstruction & Data EARs Log Instruction Address of Miss Data EAR also logs Data Address of Miss Log Latency of Miss Filter by latency bin Have an associated counter event Can also log TLB misses And where TLB miss was resolved Have proven to be extremely useful (c # (c   The D-EAR Shadow EffectC#The D-EAR Shadow EffectE$jThe Itanium 2 Processor s Branch Trace Buffer (BTB)*6  *)An eight entry Circular Buffer Each entry contains either: Address & Prediction Data of a branch, or Address of a branch target Uses of the BTB Mis-predicted branch profiler An efficient Instruction Address Profiler Path Profiler Cool use: in conjunction with EARs Path leading up to sampled miss!;ZEZZVZ#Z!Z;EV#!  ,q"F%pThe Itanium 2 processor s PMU Helps Improve Performance*9  -G& ConclusionsWalking a micron in HW design shoes Balancing PMU functionality & overall performance We need to move beyond counters! Itanium 2 processors provide EARs and BTBs What s next? The Itanium 2 processor s PMU has much to offer Customers are making good use of it Would like to see more use  how do we do it? Discussion What is the long-term vision for the PMU? What can the PMU provide to improve current and future systems Did anything  stick or resonate? $Z2Z!Z9Z0ZRZ ZZ$2!  10R  ,'H',For More Information& .!http://developer.intel.com/design/itanium/documentation.htm Manuals Intel Itanium Architecture Software Developer's Manuals Volume 1: Application Architecture Part II: Optimization Guide Intel Itanium Architecture Software Developer's Manuals Volume 2: System Architecture Chapter 7: Debugging and Performance Monitoring Chapter 12: Performance Monitoring Support Intel Itanium 2 Processor Reference Manual for Software Development and Optimization Chapter 10: Performance Monitoring Chapter 11: Performance Monitor Events N";   J4Z"UcTP 0; 0J 0 0~/8Dr   0` f3|` 3f3` ___>?" dd@ 33?" Pd@  d 33" @ `33"  n?" dd@   @@``PT   @ ` ` p>>L0   T (    Z݇gֳgֳ ?"P  T Click to edit Master title style! !B  N|gֳgֳ ?"  RClick to edit Master text styles Second level Third level Fourth level Fifth level!     Sl  6331?"(l  61?"Xx  BA ?"`p  :A  dot2"=p8T `t  " ,@tB  B 6D>"t    BCDEF( @`"6tB  B 6D>"`_   0` " `   xItanium Processor PMUF   33.33& 33   0 " @  F*     0$ " P @  F13 February 2005  N  6޽h? ? 44̙ff34,___PPT10 . $Blank Presentation $ 0L0  e(  l  6331?"(l  61?"Xx  BA ?"`  6 "`0  T Click to edit Master title style! !  0 "`  W#Click to edit Master subtitle style$ $N  6޽h? ? 44̙ff34,___PPT10 .$ 0 zr@ (    0M P    P*    0     R*  d  c $ ?    0P  0  RClick to edit Master text styles Second level Third level Fourth level Fifth level!     S  6`V _P   P*    6\Z _   R*  H  0޽h ? 3380___PPT10.P1;% 0 RJ (  x  c $`0  x  c $`    0$ J Intel Corp. 2005( 2"H  0޽h ? 33___PPT10i.~+D=' 1 = @B +o $ 0 \(  x  c $HnP     c $ r<$ 0  H  0޽h ? 33KC___PPT10#.. pJ+[W_D ' 1 = @B Dn ' = @BA?%,( < +O%,( < +D' =%(D)' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*2%(D' =%(D)' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*2K%(D' =%(D)' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*Kq%(D' =%(D)' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*q%(D' =%(D)' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(+8+0+0 +s $ 0 \(  x"  c $tP     c $u<$ 0  H  0޽h ? 3fffff3̙3f̙OG___PPT10'.. 胶+FD' 1 = @B Dr' = @BA?%,( < +O%,( < +D ' =%(Df ' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*.%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*.@%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*@Q%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*Qe%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*ez%(DZ' =%(D' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*z%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =%(D)' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(+8+0+0 +$$ 0 ##*2"(  X  0P   0hP  ? PMU Central ( 2 X  0  @  0씐   ; Collector 2 X  0p  0(`pG ; Collector 2 X  0  00 ; Collector 2 X  0 P@  0t P  ; Collector 2 X  0   0d` G ; Collector 2   BC DEdF,AA hZFS88*Q"zP#!D@          BCDEdF,AAP)/=FU|_rlfwZ?$F 3) hu@        i  B\CLDEdF,AALCK6f$ \yC<3.K7Z \ U S @        op @ HZG&HVI&oj"  BH^@IZo  j" @ BHIo   j"  BZH@Iho ( Pp  HZGr}HIr}o x  B C DEXF(AA  WK3'l::ibE@          BhCDE@F AA v9SHZ^hhzh\K32",* @     [ }   BFCDELF$AAfj3/1>?iFE?E_M @      L "  BC2DEpF0AA=4_7#ATt -=82\./%#@         A   BC1DEXF(AA1,Q a@4_ ;P"zR(:7I_@         BCDEXF(AA4uRE^ODtl h^K;x@       #  ! BCDEdF,AAe5/+6{=qX)b P@          " BCDELF$AAfI+"`EPyBEHOO@       C  # B]CiDEdF,AA >oDJJQaw%5`?.;i&G-;z>bSR]=@        @]" $ BCDEpF0AAoA<R+ixui1 Zuu 6/*"@         r PZ % BCDEXF(AA /Ko90#Tp{p2P(E' @        & l  & B%CDE FdAACC%>}yvvrmd^iLK<0. |jT;)&Esho =9#/%"*.3 86$h/luHR'R/0@                      P  ( BCDEXF(AA @(SHd{1^ E@       @S < ) BVCDE@F AA/C@m Hmi-<VV @     6 * 0`` [!The PMU Has Tentacles Everywhere!"( 2"2 + B3C%DE|F4AAl%Z SC9+!nnSI=?S/h/$ *31e#D5 + @           , BvCDELF$AAvBtHf6& {P 6:==@       N  . BCDE@F AA5W<kX  (/<< @     xIn 0 BUC/DEXF(AA)U6I0s%"^WSJB5.)-(/  @       B 1 BCYDEF8AA""TYZ3eHsaw  @G`|wf>4%  @ K$Y-P@           @ 2 B%C/DEdF,AA#/!$ %L0  @        c Ns H  0޽h ?_    3fffff3̙3f̙___PPT10i. $+D=' 1 = @B + $ 0 0(  x"  c $ؐP   x  c $xِ  H  0޽h ? 3fffff3̙3f̙___PPT10i. +D=' 1 = @B +L $ 0 \(  x"  c $pP     c $p<$ 0  H  0޽h ? 3fffff3̙3f̙( ___PPT10.. M+FD' 1 = @B DK' = @BA?%,( < +O%,( < +D ' =%(D ' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<* %(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<* 1%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*1f%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*f%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D ' =%(D' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*D%(D' =%(D)' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*D%(+8+0+0 + $ 0 \(  x"  c $hP     c $h<$ 0  H  0޽h ? 3fffff3̙3f̙___PPT10.. 0 +FD.' 1 = @B D' = @BA?%,( < +O%,( < +D3' =%(D' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*9%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*9%(D ' =%(D ' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<* %(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<* 2%(+8+0+0 +W $ 0L0 VN0%t(  tr t S  P   4  %t #"2&nnnnnnnn  t < ?  K443 @` t <?  KTotal @` t <&? $   J20 @` t </?$  dMisc @` t <8? $  J73 @` t <LA? $  IBus @` t <I? H   K150 @` t <K?H  u Caches & TLBs  @` t <[? H  J69 @`  t <d? H  NBranches   @`  t <m? l J42 @`  t <u?l  [Instruction Execution @`  t <L~? l J89 @`  t <? l VCycle Accounting @` t <X?  XNumber of Events @` t <ؙ?  XEvent Categories @``B t 0o ?ZB t s *1 ?ZB t s *1 ?llZB t s *1 ?ZB t s *1 ?H H ZB t s *1 ?  ZB t s *1 ?$ $ ZB t s *1 ?  `B t 0o ?`B  t 0o ?ZB !t s *1 ?  `B "t 0o ?H t 0޽h ? 44̙ff3___PPT10i. EWR+D=' 1 = @B + $ 0 0(  x"  c $P   x  c $̤  H  0޽h ? 3fffff3̙3f̙___PPT10i. pv+D=' 1 = @B +b $ 0L0 P||(  | | S (P<$ 0    | S (<$ 0  H | 0޽h ? 44̙ff3___PPT10.. p-N+ D6' 1 = @B D' = @BA?%,( < +O%,( < +D' =%(%(D' =%(D8' =A@BB BB0B%(D' =1:Bvisible*o3>+B#style.visibility<*|%(D' =-g6B fade*<3<*|D ' =%(DP ' =%(D8' =A@BB BB0B%(D' =1:Bvisible*o3>+B#style.visibility<*|%(D' =-g6B fade*<3<*|D8' =A@BB BB0B%(D' =1:Bvisible*o3>+B#style.visibility<*|J%(D' =-g6B fade*<3<*|JD8' =A@BB BB0B%(D' =1:Bvisible*o3>+B#style.visibility<*|Jk%(D' =-g6B fade*<3<*|JkD8' =A@BB BB0B%(D' =1:Bvisible*o3>+B#style.visibility<*|k%(D' =-g6B fade*<3<*|kDh' =%(D' =%(D8' =A@BB BB0B%(D' =1:Bvisible*o3>+B#style.visibility<*|%(D' =-g6B fade*<3<*|D8' =A@BB BB0B%(D' =1:Bvisible*o3>+B#style.visibility<*|%(D' =-g6B fade*<3<*|D8' =A@BB BB0B%(D' =1:Bvisible*o3>+B#style.visibility<*|%(D' =-g6B fade*<3<*|+p+0+|0 ++0+|0 + $ 0L0 `~(  r  S ̲P   r  S Ͳ  R  C *ACKE50001` H  0޽h ? 44̙ff3___PPT10i.  EG+D=' 1 = @B +F $ 0L0 IA@(  @ @ s *<ղP   {| @ T1?`2= @  nA1?25%6= @  nA1?25%K=B @ ZD1?=66B @ ZD1?=KKB @ ZD1?=PPB  @ ZD1?=B  @ ZD1?=\\B  @ ZD1?=B  @ ZD1?=  @ # l<߲@E@E1?} lMiss.0     @ # l@E@E1?% `Miss"0 2  5 @ C xD@E@E? 1?C F  Miss RecordedF0( 2 0     A @ # l@E@E1?BQ  Miss Recorded^0( 2 0   r @ Z1?rY9 @ # lL @E@E1?H 0 =Without extra hardware, these misses would never be recorded!&>0 2>   @ # l@E@E1?L(  rLatency Counter Busy$0( 2    @ # ll#@E@E1?*V pLatency Counter Busy"0 2  H @ 0޽h ? a(___PPT10e.+D=' 1 = @B +w $ 0L0 zrp (    s * /P   {|  T1?`2=   nA1?25%6=   nA1?25%K=B  ZD1?=66B  ZD1?=KKB  ZD1?=PPB   ZD1?=B   ZD1?=\\B   ZD1?=B   ZD1?=   # ld0@E@E1?} lMiss.0      # l;@E@E1?% `Miss"0 2  5  C xdD@E@E? 1?C F  Miss RecordedF0( 2 0     A  # lY@E@E1?BQ  Miss Recorded^0( 2 0   r  Z1?rY9  # l I@E@E1?H 0 =Without extra hardware, these misses would never be recorded!&>0 2>    # lh>@E@E1?L(  rLatency Counter Busy$0( 2     # lp@E@E1?*V pLatency Counter Busy"0 2  E  # l@E@E1?p  !The Itanium 2 Processor SolutionN"0( 2 OOO    # l4@E@E1?  @Don t Track every Opportunity -- randomly pick misses to track Tradeoff: shadow mitigation versus sampling frequency Use LFSR to decide which port to sample and if to sample Every miss has ~1 in 8 chance of being tracked This mitigates the shadow effect, does not totally eliminate it Customer feedback indicates it works very wellpu1 2h1 2o1 2uhn  H  0޽h ? a(___PPT10e.+D=' 1 = @B + $ 0L0 $(  r  S {P   r  S X|  H  0޽h ? 44̙ff3___PPT10i. 8g+D=' 1 = @B +  $ 0L0  (  r  S @P   X  0A?  0짶 )Performance is measured using specific computer systems and reflect the approximate performance of Intel products as measured by those tests. Any difference in system hardware or software design or configuration may affect actual performance.  2H  0޽h ? 44̙ff3___PPT10i. `C5v+D=' 1 = @B + $ 0L0 M(  r  S tƶP     S tǶ<$ 0    0\ʶ` , 2 a  0̶0 * Itanium and Itanium 2 are trademarks or registered trademarks of Intel Corporation or its subsidiaries in the United States and other countriesT 2 * " *}" H  0޽h ? 44̙ff3___PPT10b.. ';+FD' 1 = @B D' = @BA?%,( < +O%,( < +DZ' =%(D' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*$%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*$V%(D3' =%(D' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*Vw%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*w%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D3' =%(D' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*2%(D ' =%(D' =%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*2=%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*=g%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*g%(D' =ABBB@B0B%())))?D' =1:Bvisible*o3>+B#style.visibility<*%(+8+0+0 + $ 0L0 $(  r  S P   r  S   H  0޽h ? 44̙ff3___PPT10i.+D=' 1 = @B + 0 DR(  Dd D c $"7    D s *n @   < .33MMffH D 0޽h ? ̙33# 0 R(  d  c $"7     s *?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_`abcdefghijklmnopqrstuvwxyz{|}~     Root EntrydO)PicturesaWCurrent UserSummaryInformation(UPowerPoint Document(,NDocumentSummaryInformation8Root EntrydO)0zPicturesaWCurrent UserSummaryInformation(U     ՜.+,D՜.+,d    On-screen ShowHewlett-Packard  Arial Arial Black WingdingsTimes New RomanITCCentury BookBlank Presentation7Confessions of a Performance Monitor Hardware DesignerWhy Include a PMU?>How much Performance would you give up for PMU Functionality?Slide 4What to Architect in the PMU?Itanium Architecture: PMU,Performance Events Let me count the ways Itanium 2 Processor PMU Events$Where are the Performance Problems?,A Better Way to Locate Performance ProblemsLend Me an EARThe D-EAR Shadow EffectThe D-EAR Shadow Effect6The Itanium 2 Processors Branch Trace Buffer (BTB)9The Itanium 2 processors PMU Helps Improve Performance ConclusionsFor More Information.  Fonts UsedDesign Template Slide Titles8 8@ _PID_HLINKSA<http://developer.intel.com/design/itanium/documentation.htmBhttp://developer.intel.com/design/itanium/manuals/iiasdmanual.htm applicationBhttp://developer.intel.com/design/itanium/manuals/iiasdmanual.htmsystem>http://developer.intel.com/design/itanium2/manuals/251110.htmPowerPoint Document(,NDocumentSummaryInformation8