SVD Decomposition
We begin this section with an important definition: the singular values of an $m\times n$ matrix $A$ are the square roots of the nonzero eigenvalues of $A^TA$.
Singular Value Decomposition (SVD) can be thought of as a generalization of orthogonal diagonalization of a symmetric matrix to an arbitrary matrix. This decomposition is the focus of this section.
The following is a useful result that will help when computing the SVD of matrices.
Let $A$ be an $m\times n$ matrix. Then $A^TA$ and $AA^T$ have the same nonzero eigenvalues.
- Proof
- Suppose $A$ is an $m\times n$ matrix, and suppose that $\lambda$ is a nonzero eigenvalue of $A^TA$. Then
there exists a nonzero vector $\vec{x}$ in $\mathbb{R}^{n}$ such that \begin{equation} \label{nonzero} (A^TA)\vec{x}=\lambda \vec{x} \end{equation}
Multiplying both sides of this equation by $A$ yields: \begin{eqnarray*} A(A^TA)\vec{x} & = & A\lambda \vec{x}\\ (AA^T)(A\vec{x}) & = & \lambda (A\vec{x}) \end{eqnarray*}Since $\lambda \neq 0$ and $\vec{x}\neq \vec{0}$, $\lambda \vec{x}\neq \vec{0}$, and thus by equation (\ref{nonzero}), $(A^TA)\vec{x}\neq \vec{0}$; thus $A^T(A\vec{x})\neq \vec{0}$, implying that $A\vec{x}\neq \vec{0}$.
Therefore $A\vec{x}$ is an eigenvector of $AA^T$ corresponding to eigenvalue $\lambda$. An analogous argument can be used to show that every nonzero eigenvalue of $AA^T$ is an eigenvalue of $A^TA$, thus completing the proof.
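This lemma is easy to check numerically. The following sketch (assuming NumPy is available; the random matrix is purely illustrative) compares the nonzero eigenvalues of $A^TA$ and $AA^T$:
\begin{verbatim}
import numpy as np

# A random 4 x 6 matrix; the lemma holds for any m x n matrix.
rng = np.random.default_rng(0)
A = rng.standard_normal((4, 6))

# A^T A is 6 x 6 and A A^T is 4 x 4, so they have different
# numbers of eigenvalues, but the nonzero ones agree.
eig_AtA = np.linalg.eigvalsh(A.T @ A)
eig_AAt = np.linalg.eigvalsh(A @ A.T)

nonzero_AtA = np.sort(eig_AtA[eig_AtA > 1e-10])
nonzero_AAt = np.sort(eig_AAt[eig_AAt > 1e-10])

print(np.allclose(nonzero_AtA, nonzero_AAt))  # True
\end{verbatim}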
Given an $m\times n$ matrix $A$, we will see how to express $A$ as a product $A=U\Sigma V^T$, where
- $U$ is an $m\times m$ orthogonal matrix whose columns are eigenvectors of $AA^T$.
- $V$ is an $n\times n$ orthogonal matrix whose columns are eigenvectors of $A^TA$.
- $\Sigma$ is an $m\times n$ matrix whose only nonzero values lie on its main diagonal, and are the singular values of $A$.
How can we find such a decomposition? We are aiming to decompose $A$ in the following form: \begin{equation*} A=U\left [ \begin{array}{cc} \sigma & 0 \\ 0 & 0 \end{array} \right ] V^T \end{equation*} where $\sigma$ is a block matrix of the form \begin{equation*} \sigma =\left [ \begin{array}{ccc} \sigma _{1} & & 0 \\ & \ddots & \\ 0 & & \sigma _{k} \end{array} \right ] \end{equation*} Thus $A^T=V\left [ \begin{array}{cc} \sigma & 0 \\ 0 & 0 \end{array} \right ] U^T$ and it follows that \begin{equation*} A^TA=V\left [ \begin{array}{cc} \sigma & 0 \\ 0 & 0 \end{array} \right ] U^TU\left [ \begin{array}{cc} \sigma & 0 \\ 0 & 0 \end{array} \right ] V^T=V\left [ \begin{array}{cc} \sigma ^{2} & 0 \\ 0 & 0 \end{array} \right ] V^T \end{equation*} and so $A^TAV=V\left [ \begin{array}{cc} \sigma ^{2} & 0 \\ 0 & 0 \end{array} \right ]$. Similarly, $AA^TU=U\left [ \begin{array}{cc} \sigma ^{2} & 0 \\ 0 & 0 \end{array} \right ]$. Therefore, you would find an orthonormal basis of eigenvectors for $A^TA$ and make them the columns of a matrix, ordered so that the corresponding eigenvalues are decreasing. This gives $V$. You could then do the same for $AA^T$ to get $U$.
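As a numerical illustration of these relations (using NumPy; the matrix below is arbitrary and not one of the examples that follow), the columns of $V$ and $U$ produced by a standard SVD routine do diagonalize $A^TA$ and $AA^T$, with the squared singular values on the diagonal:
\begin{verbatim}
import numpy as np

A = np.array([[3.0, 1.0, 1.0],
              [-1.0, 3.0, 1.0]])

# numpy returns A = U @ diag(s) @ Vt with s in decreasing order.
U, s, Vt = np.linalg.svd(A)
V = Vt.T

# V^T (A^T A) V and U^T (A A^T) U are diagonal, with the squared
# singular values (padded by zeros) on the diagonal.
print(np.round(V.T @ (A.T @ A) @ V, 8))
print(np.round(U.T @ (A @ A.T) @ U, 8))
print(s**2)
\end{verbatim}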
We formalize this discussion in the following theorem.
Let $A$ be an $m\times n$ matrix. Then there exist an $m\times m$ orthogonal matrix $U$, an $n\times n$ orthogonal matrix $V$, and an $m\times n$ matrix $\Sigma =\left [ \begin{array}{cc} \sigma & 0 \\ 0 & 0 \end{array} \right ]$, where $\sigma =\left [ \begin{array}{ccc} \sigma _{1} & & 0 \\ & \ddots & \\ 0 & & \sigma _{k} \end{array} \right ]$ and $\sigma _{1}\geq \sigma _{2}\geq \cdots \geq \sigma _{k}>0$ are the singular values of $A$, such that $A=U\Sigma V^T$.
- Proof
- There exists an orthonormal basis $\{\vec{v}_{1},\ldots ,\vec{v}_{n}\}$ of $\mathbb{R}^{n}$ such that $A^TA\vec{v}_{i}=\sigma _{i}^{2}\vec{v}_{i}$, where $\sigma _{i}^{2}>0$ for $i=1,\ldots ,k$ and $\sigma _{i}$ equals zero if $i>k$.
Thus $A\vec{v}_{i}=\vec{0}$ for $i>k$ because \begin{equation*} A\vec{v}_{i}\dotp A\vec{v}_{i} = (A\vec{v}_i)^T(A\vec{v}_i)=\vec{v}_i^T(A^TA\vec{v}_i)=\vec{v}_i^T\vec{0}=0 \end{equation*}
For $i=1,\ldots ,k$, define $\vec{u}_{i}\in \mathbb{R}^{m}$ by \begin{equation*} \vec{u}_{i}= \sigma _{i}^{-1}A\vec{v}_{i} \end{equation*}
Thus $A\vec{v}_{i}=\sigma _{i}\vec{u}_{i}$. Now \begin{eqnarray*} \vec{u}_{i} \dotp \vec{u}_{j} &=& \sigma _{i}^{-1}A \vec{v}_{i} \dotp \sigma _{j}^{-1}A\vec{v}_{j} = \sigma _{i}^{-1}\vec{v}_{i}^T \sigma _{j}^{-1}A^TA\vec{v}_{j} \\ &=& \sigma _{i}^{-1}\vec{v}_{i} \dotp \sigma _{j}^{-1}\sigma _{j}^{2} \vec{v}_{j} = \frac{\sigma _{j}}{\sigma _{i}}\left ( \vec{v}_{i} \dotp \vec{v}_{j}\right ) \end{eqnarray*}This means that $\vec{u}_{i}\dotp \vec{u}_{j}=0$ when $i\neq j$ and $\vec{u}_{i}\dotp \vec{u}_{j}=1$ when $i=j$. Thus $\{\vec{u}_{1},\ldots ,\vec{u}_{k}\}$ is an orthonormal set of vectors in $\mathbb{R}^{m}$. Also, \begin{equation*} AA^T\vec{u}_{i}=AA^T\sigma _{i}^{-1}A\vec{v}_{i}=\sigma _{i}^{-1}AA^TA\vec{v}_{i}=\sigma _{i}^{-1}A\sigma _{i}^{2}\vec{v} _{i}=\sigma _{i}^{2}\vec{u}_{i} \end{equation*} Now, using Gram-Schmidt, extend $\{\vec{u}_{1},\ldots ,\vec{u}_{k}\}$ to an orthonormal basis $\{\vec{u}_{1},\ldots ,\vec{u}_{m}\}$ for all of $\mathbb{R}^{m}$ and let \begin{equation*} U= \left [ \begin{array}{ccc} \vec{u}_{1} & \cdots & \vec{u}_{m} \end{array} \right ] \end{equation*} while $V=\left [ \begin{array}{ccc} \vec{v}_{1} & \cdots & \vec{v}_{n} \end{array} \right ]$. Thus $U$ is the matrix which has the $\vec{u}_{i}$ as columns and $V$ is defined as the matrix which has the $\vec{v}_{i}$ as columns. Then \begin{equation*} U^TAV=\left [ \begin{array}{c} \vec{u}_{1}^T \\ \vdots \\ \vec{u}_{k}^T \\ \vdots \\ \vec{u}_{m}^T \end{array} \right ] A \left [ \begin{array}{ccc} \vec{v}_{1} & \cdots & \vec{v}_{n}\end{array}\right ] \end{equation*} \begin{equation*} =\left [ \begin{array}{c} \vec{u}_{1}^T \\ \vdots \\ \vec{u}_{k}^T \\ \vdots \\ \vec{u}_{m}^T \end{array} \right ] \left [ \begin{array}{cccccc} \sigma _{1}\vec{u}_{1} & \cdots & \sigma _{k}\vec{u}_{k} & \vec{0} & \cdots & \vec{0} \end{array} \right ] =\left [ \begin{array}{cc} \sigma & 0 \\ 0 & 0 \end{array} \right ] \end{equation*} where $\sigma$ is given in the statement of the theorem.
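The two key facts established in this proof, that the vectors $\vec{u}_i = \sigma_i^{-1}A\vec{v}_i$ form an orthonormal set and are eigenvectors of $AA^T$ with eigenvalue $\sigma_i^2$, can be confirmed numerically. A minimal NumPy sketch (the random matrix is illustrative only):
\begin{verbatim}
import numpy as np

rng = np.random.default_rng(1)
A = rng.standard_normal((3, 5))

# Orthonormal eigenvectors v_i of A^T A with nonzero eigenvalues sigma_i^2.
lam, V = np.linalg.eigh(A.T @ A)
keep = lam > 1e-10
lam, V = lam[keep], V[:, keep]
sigma = np.sqrt(lam)

# u_i = sigma_i^{-1} A v_i, as in the proof.
U = A @ V / sigma

# {u_1, ..., u_k} is an orthonormal set ...
print(np.allclose(U.T @ U, np.eye(U.shape[1])))      # True
# ... and each u_i is an eigenvector of A A^T with eigenvalue sigma_i^2.
print(np.allclose((A @ A.T) @ U, U * sigma**2))      # True
\end{verbatim}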
The SVD has as an immediate corollary the following interesting result.
Let’s compute the SVD of a simple matrix.
Since $A^TA$ is $3\times 3$ while $AA^T$ is only $2\times 2$, and $A^TA$ and $AA^T$ have the same nonzero eigenvalues (by the lemma above), we compute the characteristic polynomial of $AA^T$ (because it is easier to compute than that of $A^TA$).
The eigenvalues of $A^TA$ are $\lambda _{1}$, $\lambda _{2}$, and $\lambda _{3}=0$, and the singular values of $A$ are $\sigma _{1}=\sqrt{\lambda _{1}}$ and $\sigma _{2}=\sqrt{\lambda _{2}}$. By convention, we list the eigenvalues (and corresponding singular values) in non-increasing order (i.e., from largest to smallest).
To find the matrix $V$:
To construct the matrix $V$ we need to find eigenvectors for $A^TA$. Since the eigenvalues of $A^TA$ are distinct, the corresponding eigenvectors are orthogonal, and we need only normalize them.
$\lambda _{1}$: solve $(\lambda _{1}I-A^TA)\vec{x}=\vec{0}$.
$\lambda _{2}$: solve $(\lambda _{2}I-A^TA)\vec{x}=\vec{0}$.
$\lambda _{3}$: solve $(\lambda _{3}I-A^TA)\vec{x}=\vec{0}$. Let $\vec{v}_{1}$, $\vec{v}_{2}$, and $\vec{v}_{3}$ denote the resulting normalized eigenvectors. Then $V=\left [ \begin{array}{ccc} \vec{v}_{1} & \vec{v}_{2} & \vec{v}_{3} \end{array} \right ]$ is orthogonal. Also, $\Sigma =\left [ \begin{array}{ccc} \sigma _{1} & 0 & 0 \\ 0 & \sigma _{2} & 0 \end{array} \right ]$, and we use $A$, $V$, and $\Sigma$ to find $U$. Since $V$ is orthogonal and $A=U\Sigma V^T$, it follows that $AV=U\Sigma$. Let $V=\left [ \begin{array}{ccc} \vec{v}_{1} & \vec{v}_{2} & \vec{v}_{3} \end{array} \right ]$, and let $U=\left [ \begin{array}{cc} \vec{u}_{1} & \vec{u}_{2} \end{array} \right ]$, where $\vec{u}_{1}$ and $\vec{u}_{2}$ are the two columns of $U$. Then we have \begin{equation*} A\left [ \begin{array}{ccc} \vec{v}_{1} & \vec{v}_{2} & \vec{v}_{3} \end{array} \right ] =\left [ \begin{array}{cc} \vec{u}_{1} & \vec{u}_{2} \end{array} \right ] \left [ \begin{array}{ccc} \sigma _{1} & 0 & 0 \\ 0 & \sigma _{2} & 0 \end{array} \right ] \end{equation*} that is, $A\vec{v}_{1}=\sigma _{1}\vec{u}_{1}$, $A\vec{v}_{2}=\sigma _{2}\vec{u}_{2}$, and $A\vec{v}_{3}=\vec{0}$, so that $\vec{u}_{1}=\sigma _{1}^{-1}A\vec{v}_{1}$ and $\vec{u}_{2}=\sigma _{2}^{-1}A\vec{v}_{2}$.
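Because the particular matrix used in this example is not reproduced above, here is a sketch of the same procedure in NumPy for an illustrative $2\times 3$ matrix (the matrix is my own choice, not taken from the text): diagonalize $A^TA$ to get $V$ and the singular values, then use $AV=U\Sigma$ to get $U$.
\begin{verbatim}
import numpy as np

# An illustrative 2 x 3 matrix (not necessarily the one from the example).
A = np.array([[1.0, 0.0, 1.0],
              [-1.0, 1.0, 0.0]])

# Eigenvalues/eigenvectors of A^T A, sorted so the eigenvalues decrease.
lam, V = np.linalg.eigh(A.T @ A)
order = np.argsort(lam)[::-1]
lam, V = lam[order], V[:, order]

sigma = np.sqrt(lam[lam > 1e-10])          # singular values
Sigma = np.zeros(A.shape)
Sigma[:len(sigma), :len(sigma)] = np.diag(sigma)

# AV = U Sigma, so the columns of U are u_i = sigma_i^{-1} A v_i.
U = A @ V[:, :len(sigma)] / sigma

print(np.allclose(U @ Sigma @ V.T, A))     # True
\end{verbatim}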
Here is another example.
Suppose now that $A$ is a $1\times 3$ matrix. Then $AA^T$ is $1\times 1$, so it has a single eigenvalue $\lambda _{1}$, and the eigenvalues of $A^TA$ are $\lambda _{1}$, $0$, and $0$. Furthermore, $A$ has only one singular value, $\sigma _{1}=\sqrt{\lambda _{1}}$.
To find the matrix $U$: To do so we find an eigenvector for $AA^T$ and normalize it. In this case, finding a unit eigenvector is trivial: since $AA^T$ is $1\times 1$, we may take $\vec{u}_{1}=\left [ 1 \right ]$, and so $U=\left [ 1 \right ]$. Also, $\Sigma =\left [ \begin{array}{ccc} \sigma _{1} & 0 & 0 \end{array} \right ]$, and we use $A$, $U$, and $\Sigma$ to find $V$.
Now $A=U\Sigma V^T$, with $\Sigma =\left [ \begin{array}{ccc} \sigma _{1} & 0 & 0 \end{array} \right ]$ and $V=\left [ \begin{array}{ccc} \vec{v}_{1} & \vec{v}_{2} & \vec{v}_{3} \end{array} \right ]$, where $\vec{v}_{1}$, $\vec{v}_{2}$, and $\vec{v}_{3}$ are the columns of $V$. Thus $A=\Sigma V^T=\sigma _{1}\vec{v}_{1}^T$, so that $\vec{v}_{1}=\sigma _{1}^{-1}A^T$.
The vectors $\vec{v}_{2}$ and $\vec{v}_{3}$ are eigenvectors of $A^TA$ corresponding to the eigenvalue $0$. Instead of solving the system $(A^TA)\vec{x}=\vec{0}$ and then using the Gram-Schmidt process on the resulting set of two basic eigenvectors, the following approach may be used (a numerical sketch of this approach appears after the example).
Find vectors $\vec{v}_{2}$ and $\vec{v}_{3}$ by first extending $\{\vec{v}_{1}\}$ to a basis of $\mathbb{R}^{3}$, then using the Gram-Schmidt algorithm to orthogonalize the basis, and finally normalizing the vectors.
Starting with a convenient scalar multiple of $\vec{v}_{1}$ instead of $\vec{v}_{1}$ itself makes the arithmetic a bit easier. It is easy to verify that the extended set of three vectors is a basis of $\mathbb{R}^{3}$. We apply the Gram-Schmidt algorithm to this basis and normalize the results; the first vector is again $\vec{v}_{1}$, and the other two are the desired $\vec{v}_{2}$ and $\vec{v}_{3}$. Finally, \begin{equation*} V=\left [ \begin{array}{ccc} \vec{v}_{1} & \vec{v}_{2} & \vec{v}_{3} \end{array} \right ] \end{equation*} and $A=U\Sigma V^T$ is a singular value decomposition of $A$.
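The extension idea used above can be sketched in code as follows (NumPy; the $1\times 3$ matrix and the gram_schmidt helper are illustrative assumptions, not the data of this example): extend $\{\vec{v}_1\}$ by standard basis vectors, orthonormalize with Gram-Schmidt, and assemble $V$.
\begin{verbatim}
import numpy as np

def gram_schmidt(vectors, tol=1e-12):
    """Orthonormalize a list of vectors, dropping near-zero remainders."""
    basis = []
    for v in vectors:
        w = v - sum(np.dot(v, b) * b for b in basis)
        if np.linalg.norm(w) > tol:
            basis.append(w / np.linalg.norm(w))
    return basis

# An illustrative 1 x 3 matrix (not necessarily the one from the example).
A = np.array([[2.0, -1.0, 2.0]])

sigma1 = np.linalg.norm(A)                 # the only singular value
v1 = (A.T / sigma1).flatten()              # v_1 = sigma_1^{-1} A^T

# Extend {v_1} by the standard basis, then orthonormalize.
candidates = [v1,
              np.array([1.0, 0.0, 0.0]),
              np.array([0.0, 1.0, 0.0]),
              np.array([0.0, 0.0, 1.0])]
v1, v2, v3 = gram_schmidt(candidates)

V = np.column_stack([v1, v2, v3])
U = np.array([[1.0]])
Sigma = np.array([[sigma1, 0.0, 0.0]])

print(np.allclose(U @ Sigma @ V.T, A))     # True
\end{verbatim}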
Consider another example.
Let \begin{equation*} A=\left [ \begin{array}{ccc} \frac{2}{5}\sqrt{2}\sqrt{5} & \frac{4}{5}\sqrt{2}\sqrt{5} & 0 \\ \frac{2}{5}\sqrt{2}\sqrt{5} & \frac{4}{5}\sqrt{2}\sqrt{5} & 0 \end{array} \right ] \end{equation*} Then \begin{equation*} A^TA=\frac{1}{5}\left [ \begin{array}{ccc} 16 & 32 & 0 \\ 32 & 64 & 0 \\ 0 & 0 & 0 \end{array} \right ] \end{equation*} which has eigenvalues $16$, $0$, and $0$, with eigenspaces \begin{equation*} \mathcal{S}_0=\mbox{span}\left ( \left [ \begin{array}{c} 0 \\ 0 \\ 1 \end{array} \right ] ,\left [ \begin{array}{c} -\frac{2}{5}\sqrt{5} \\ \frac{1}{5}\sqrt{5} \\ 0 \end{array} \right ] \right ), \quad \mathcal{S}_{16}=\mbox{span}\left ( \left [ \begin{array}{c} \frac{1}{5}\sqrt{5} \\ \frac{2}{5}\sqrt{5} \\ 0 \end{array} \right ] \right ) \end{equation*} Thus the matrix $V$ is given by \begin{equation*} V=\left [ \begin{array}{ccc} \frac{1}{5}\sqrt{5} & -\frac{2}{5}\sqrt{5} & 0 \\ \frac{2}{5}\sqrt{5} & \frac{1}{5}\sqrt{5} & 0 \\ 0 & 0 & 1 \end{array} \right ] \end{equation*} Next consider \begin{equation*} AA^T=\left [ \begin{array}{cc} 8 & 8 \\ 8 & 8 \end{array} \right ] \end{equation*} Its eigenvalues are $16$ and $0$, and its eigenspaces are
\begin{equation*} \mathcal{S}_0=\mbox{span}\left (\left [ \begin{array}{c} -\frac{1}{2}\sqrt{2} \\ \frac{1}{2}\sqrt{2} \end{array} \right ] \right ),\quad \mathcal{S}_{16}=\mbox{span}\left ( \left [ \begin{array}{c} \frac{1}{2}\sqrt{2} \\ \frac{1}{2}\sqrt{2} \end{array} \right ] \right ) \end{equation*} Thus you can let $U$ be given by \begin{equation*} U=\left [ \begin{array}{cc} \frac{1}{2}\sqrt{2} & -\frac{1}{2}\sqrt{2} \\ \frac{1}{2}\sqrt{2} & \frac{1}{2}\sqrt{2} \end{array} \right ] \end{equation*} Let's check this: $U^TAV$ should equal $\Sigma$. \begin{equation*} \left [ \begin{array}{cc} \frac{1}{2}\sqrt{2} & \frac{1}{2}\sqrt{2} \\ -\frac{1}{2}\sqrt{2} & \frac{1}{2}\sqrt{2} \end{array} \right ] \left [ \begin{array}{ccc} \frac{2}{5}\sqrt{2}\sqrt{5} & \frac{4}{5}\sqrt{2}\sqrt{5} & 0 \\ \frac{2}{5}\sqrt{2}\sqrt{5} & \frac{4}{5}\sqrt{2}\sqrt{5} & 0 \end{array} \right ] \left [ \begin{array}{ccc} \frac{1}{5}\sqrt{5} & -\frac{2}{5}\sqrt{5} & 0 \\ \frac{2}{5}\sqrt{5} & \frac{1}{5}\sqrt{5} & 0 \\ 0 & 0 & 1 \end{array} \right ] \end{equation*} \begin{equation*} =\left [ \begin{array}{ccc} 4 & 0 & 0 \\ 0 & 0 & 0 \end{array} \right ] \end{equation*}
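This check can also be done numerically; the following NumPy snippet rebuilds the matrices above and verifies both $U^TAV=\Sigma$ and $A=U\Sigma V^T$.
\begin{verbatim}
import numpy as np

s2, s5 = np.sqrt(2), np.sqrt(5)

A = np.array([[2 * s2 * s5 / 5, 4 * s2 * s5 / 5, 0.0],
              [2 * s2 * s5 / 5, 4 * s2 * s5 / 5, 0.0]])
V = np.array([[s5 / 5, -2 * s5 / 5, 0.0],
              [2 * s5 / 5, s5 / 5, 0.0],
              [0.0, 0.0, 1.0]])
U = np.array([[s2 / 2, -s2 / 2],
              [s2 / 2, s2 / 2]])
Sigma = np.array([[4.0, 0.0, 0.0],
                  [0.0, 0.0, 0.0]])

print(np.allclose(U.T @ A @ V, Sigma))     # True
print(np.allclose(U @ Sigma @ V.T, A))     # True
\end{verbatim}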
This illustrates that if you have a good way to find the eigenvectors and eigenvalues for a Hermitian matrix which has nonnegative eigenvalues, then you also have a good way to find the SVD of an arbitrary matrix.
Practice Problems
Text Source
This section was adapted from Section 8.11 of Keith Nicholson’s Linear Algebra with Applications. (CC-BY-NC-SA)
W. Keith Nicholson, Linear Algebra with Applications, Lyryx 2018, Open Edition.