@@ -185,13 +185,15 @@ export default function UShapeAttentionCurve({
185185
186186 return (
187187 < div className = { containerClassName } >
188- < div className = { styles . header } >
189- < h4 className = { styles . title } > Context Window Attention Curve</ h4 >
190- < span className = { styles . subtitle } >
191- Information at the beginning and end gets strong attention, middle
192- gets skimmed
193- </ span >
194- </ div >
188+ { ! compact && (
189+ < div className = { styles . header } >
190+ < h4 className = { styles . title } > Context Window Attention Curve</ h4 >
191+ < span className = { styles . subtitle } >
192+ Information at the beginning and end gets strong attention, middle
193+ gets skimmed
194+ </ span >
195+ </ div >
196+ ) }
195197
196198 < svg
197199 className = { styles . svg }
@@ -406,14 +408,16 @@ export default function UShapeAttentionCurve({
406408 ) ) }
407409 </ div >
408410
409- < div className = { styles . explanation } >
410- < strong > The U-Curve Effect:</ strong > The curve's width shows context
411- length, while depth shows attention quality. As context length increases,
412- the attention drop in the middle becomes more pronounced. Short contexts
413- (30%) have minimal degradation. Medium contexts (60%) show a noticeable
414- U-curve. Long contexts (90%) exhibit severe attention loss—only the
415- beginning and end are reliably processed.
416- </ div >
411+ { ! compact && (
412+ < div className = { styles . explanation } >
413+ < strong > The U-Curve Effect:</ strong > The curve's width shows context
414+ length, while depth shows attention quality. As context length increases,
415+ the attention drop in the middle becomes more pronounced. Short contexts
416+ (30%) have minimal degradation. Medium contexts (60%) show a noticeable
417+ U-curve. Long contexts (90%) exhibit severe attention loss—only the
418+ beginning and end are reliably processed.
419+ </ div >
420+ ) }
417421 </ div >
418422 ) ;
419423}
0 commit comments