Ejemplo: análisis de componentes principales 1

<!-- XY plot region ID0ERLOU.
     x-axis expression: matcol applied to Data and 0.
     y-axis expressions: matcol applied to Data and 1, and matcol applied to Data and 2.
     Two traces are declared, both with symbol "x" and line-style "None".
     NOTE(review): matcol is presumably the matrix-column operator, so this would plot
     columns 1 and 2 of Data against column 0; confirm against the Mathcad schema.
     Data itself is defined outside this fragment. -->
<region id="ID0ERLOU" top="364.80000000000007" left="38.400000000000006" height="214" width="575" xml:lang="es" xmlns="http://schemas.mathsoft.com/worksheet50">
  <plot background-type="white" xml:lang="es">
    <xyPlot xml:lang="es">
      <title class="- topic/title " xml:lang="es" toc="yes" wwtype:type="Paragraph" xmlns:wwtype="urn:WebWorks-Type-Schema" />
      <legend xml:lang="es" />
      <!-- Trace styling. The resultRef values point at results that are not visible in this fragment.
           NOTE(review): the 8-digit colour values are presumably ARGB; confirm. -->
      <traces xml:lang="es">
        <trace resultRef="128" xml:lang="es">
          <traceStyle color="#FF00008B" symbol="x" line-weight="1" line-style="None" xml:lang="es">lines</traceStyle>
        </trace>
        <trace resultRef="129" xml:lang="es">
          <traceStyle color="#FFFF0000" symbol="x" line-weight="1" line-style="None" xml:lang="es">lines</traceStyle>
        </trace>
      </traces>
      <graph-size width="436.6" height="137.2" xml:lang="es" />
      <axes xml:lang="es">
        <!-- Horizontal axis: linear scale with auto-scale="true".
             NOTE(review): the attribute end="4.6" differs from the stored endValue of 4.5 below;
             possibly an auto-scale artefact, confirm which one the renderer uses. -->
        <xAxis rank="1" legend-position="PlotBoundaryBottom" start="2.6" end="4.6" xml:lang="es">
          <axisLine position="ticknumberlock" positionticmark="0" legendWidth="100.183333333333" xml:lang="es" />
          <axisGrid xml:lang="es">
            <gridFrequency xml:lang="es">6</gridFrequency>
            <gridLabels display="true" xml:lang="es" />
            <gridLines xml:lang="es" />
            <tickMarks display="true" xml:lang="es" />
          </axisGrid>
          <axisLabel xml:lang="es" />
          <markers xml:lang="es" />
          <numberFormat xml:lang="es">
            <general precision="3" show-trailing-zeros="false" radix="dec" zero-threshold="15" imaginary-value="i" exponential-threshold="3" xml:lang="es" />
          </numberFormat>
          <!-- Each plotEquation holds two math elements: the axis expression and an empty placeholder. -->
          <plotEquations xml:lang="es">
            <plotEquation xml:lang="es">
              <math resultRef="136" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">Data</id>
                  <real xml:lang="es">0</real>
                </apply>
              </math>
              <math resultRef="137" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
          </plotEquations>
          <xyDomain scale-type="linear" auto-scale="true" xml:lang="es">
            <startValue resultRef="131" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">2.6</real>
            </startValue>
            <secondTickValue resultRef="133" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">3.0</real>
            </secondTickValue>
            <endValue xml:lang="es" resultRef="135">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">4.5</real>
            </endValue>
          </xyDomain>
        </xAxis>
        <!-- Vertical axis: linear scale with auto-scale="true"; stored limits 2 to 5.0 match start/end.
             It carries two plotEquation entries (Data with 1, Data with 2). -->
        <yAxis rank="1" legend-position="PlotBoundaryLeft" start="2" end="5" xml:lang="es">
          <axisLine position="ticknumberlock" positionticmark="0" legendWidth="100.183333333333" xml:lang="es" />
          <axisGrid xml:lang="es">
            <gridFrequency xml:lang="es">7</gridFrequency>
            <gridLabels display="true" xml:lang="es" />
            <gridLines xml:lang="es" />
            <tickMarks display="true" xml:lang="es" />
          </axisGrid>
          <axisLabel xml:lang="es" />
          <markers xml:lang="es" />
          <numberFormat xml:lang="es">
            <general precision="3" show-trailing-zeros="false" radix="dec" zero-threshold="15" imaginary-value="i" exponential-threshold="3" xml:lang="es" />
          </numberFormat>
          <plotEquations xml:lang="es">
            <plotEquation xml:lang="es">
              <math resultRef="144" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">Data</id>
                  <real xml:lang="es">1</real>
                </apply>
              </math>
              <math resultRef="145" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
            <plotEquation xml:lang="es">
              <math resultRef="146" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">Data</id>
                  <real xml:lang="es">2</real>
                </apply>
              </math>
              <math resultRef="147" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
          </plotEquations>
          <xyDomain scale-type="linear" auto-scale="true" xml:lang="es">
            <startValue resultRef="139" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">2</real>
            </startValue>
            <secondTickValue resultRef="141" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">2.5</real>
            </secondTickValue>
            <endValue xml:lang="es" resultRef="143">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">5.0</real>
            </endValue>
          </xyDomain>
        </yAxis>
      </axes>
    </xyPlot>
  </plot>
</region>

<!-- Math region ID0E3POU: definition of MeanData indexed by j.
     Left side: indexer applied to MeanData and j.
     Right side: the function mean applied to (matcol applied to Data and j).
     NOTE(review): presumably the mean of column j of Data; the range of j and Data itself
     are defined outside this fragment. -->
<region id="ID0E3POU" top="825.60000000000014" left="38.400000000000006" height="38.952000000000005" width="200.26333333333335" xml:lang="es" xmlns="http://schemas.mathsoft.com/worksheet50">
  <math resultRef="164" xml:lang="es">
    <define xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
      <apply xml:lang="es">
        <indexer xml:lang="es" />
        <id labels="*" xml:space="preserve" xml:lang="es">MeanData</id>
        <id labels="*" xml:space="preserve" xml:lang="es">j</id>
      </apply>
      <apply xml:lang="es">
        <id labels="FUNCTION" xml:space="preserve" xml:lang="es" label-is-contextual="true">mean</id>
        <apply xml:lang="es">
          <matcol xml:lang="es" />
          <id labels="VARIABLE" xml:space="preserve" xml:lang="es" label-is-contextual="true">Data</id>
          <id xml:space="preserve" xml:lang="es">j</id>
        </apply>
      </apply>
    </define>
    <!-- Result display settings: matrix format with show-indices and expand-nested-arrays both false. -->
    <resultFormat xml:lang="es">
      <matrix size="12,12" offset="0,0" show-indices="false" expand-nested-arrays="false" xml:lang="es" />
    </resultFormat>
  </math>
</region>

<!-- Math region ID0EOQOU: definition of C indexed by the pair (i, j).
     Left side: indexer applied to C and the sequence i, j.
     Right side: minus applied to Data indexed by (i, j) and MeanData indexed by j,
     i.e. each Data entry minus the MeanData value for its second index.
     The ranges of i and j are defined outside this fragment. -->
<region id="ID0EOQOU" top="883.20000000000016" left="38.400000000000006" height="36.800000000000004" width="190.07" xml:lang="es" xmlns="http://schemas.mathsoft.com/worksheet50">
  <math resultRef="166" xml:lang="es">
    <define xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
      <apply xml:lang="es">
        <indexer xml:lang="es" />
        <id labels="*" xml:space="preserve" xml:lang="es">C</id>
        <sequence xml:lang="es">
          <id labels="*" xml:space="preserve" xml:lang="es">i</id>
          <id labels="*" xml:space="preserve" xml:lang="es">j</id>
        </sequence>
      </apply>
      <apply xml:lang="es">
        <minus xml:lang="es" />
        <apply xml:lang="es">
          <indexer xml:lang="es" />
          <id labels="VARIABLE" xml:space="preserve" xml:lang="es" label-is-contextual="true">Data</id>
          <sequence xml:lang="es">
            <id xml:space="preserve" xml:lang="es">i</id>
            <id xml:space="preserve" xml:lang="es">j</id>
          </sequence>
        </apply>
        <apply xml:lang="es">
          <indexer xml:lang="es" />
          <id labels="VARIABLE" xml:space="preserve" xml:lang="es" label-is-contextual="true">MeanData</id>
          <id xml:space="preserve" xml:lang="es">j</id>
        </apply>
      </apply>
    </define>
    <!-- Result display settings: matrix format with show-indices and expand-nested-arrays both false. -->
    <resultFormat xml:lang="es">
      <matrix size="12,12" offset="0,0" show-indices="false" expand-nested-arrays="false" xml:lang="es" />
    </resultFormat>
  </math>
</region>

<!-- XY plot region ID0EDSOU.
     x-axis expression: matcol applied to C and 0.
     y-axis expressions: matcol applied to C and 1, and matcol applied to C and 2.
     The plot sets origin-positioning="true" and both axisLine elements use position="origin".
     Two traces are declared, both with symbol "x" and line-style "None".
     NOTE(review): matcol is presumably the matrix-column operator, so this would plot
     columns 1 and 2 of C against column 0; confirm against the Mathcad schema. -->
<region id="ID0EDSOU" top="960.00000000000011" left="38.400000000000006" height="312" width="574" xml:lang="es" xmlns="http://schemas.mathsoft.com/worksheet50">
  <plot background-type="white" origin-positioning="true" xml:lang="es">
    <xyPlot xml:lang="es">
      <title class="- topic/title " xml:lang="es" toc="yes" wwtype:type="Paragraph" xmlns:wwtype="urn:WebWorks-Type-Schema" />
      <legend xml:lang="es" />
      <!-- Trace styling. The resultRef values point at results that are not visible in this fragment. -->
      <traces xml:lang="es">
        <trace resultRef="168" xml:lang="es">
          <traceStyle color="#FF00008B" symbol="x" line-weight="1" line-style="None" xml:lang="es">lines</traceStyle>
        </trace>
        <trace resultRef="169" xml:lang="es">
          <traceStyle color="#FFFF0000" symbol="x" line-weight="1" line-style="None" xml:lang="es">lines</traceStyle>
        </trace>
      </traces>
      <graph-size width="454.8" height="235.2" xml:lang="es" />
      <axes xml:lang="es">
        <!-- Horizontal axis: linear scale with auto-scale="true"; stored limits -1. to 1.0 match start/end.
             Unlike the y-axis, its xyDomain stores no secondTickValue. -->
        <xAxis rank="1" legend-position="PlotBoundaryBottom" start="-1" end="1" xml:lang="es">
          <axisLine position="origin" positionticmark="3" legendWidth="77.7566666666667" xml:lang="es" />
          <axisGrid xml:lang="es">
            <gridFrequency xml:lang="es">11</gridFrequency>
            <gridLabels display="true" xml:lang="es" />
            <gridLines xml:lang="es" />
            <tickMarks display="true" xml:lang="es" />
          </axisGrid>
          <axisLabel xml:lang="es" />
          <markers xml:lang="es" />
          <numberFormat xml:lang="es">
            <general precision="3" show-trailing-zeros="false" radix="dec" zero-threshold="15" imaginary-value="i" exponential-threshold="3" xml:lang="es" />
          </numberFormat>
          <!-- Each plotEquation holds two math elements: the axis expression and an empty placeholder. -->
          <plotEquations xml:lang="es">
            <plotEquation xml:lang="es">
              <math resultRef="174" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">C</id>
                  <real xml:lang="es">0</real>
                </apply>
              </math>
              <math resultRef="175" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
          </plotEquations>
          <xyDomain scale-type="linear" auto-scale="true" xml:lang="es">
            <startValue resultRef="171" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">-1.</real>
            </startValue>
            <endValue xml:lang="es" resultRef="173">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">1.0</real>
            </endValue>
          </xyDomain>
        </xAxis>
        <!-- Vertical axis: linear scale with auto-scale="true"; stored limits -1.5 to 1.5 match start/end.
             It carries two plotEquation entries (C with 1, C with 2). -->
        <yAxis rank="1" legend-position="PlotBoundaryLeft" start="-1.5" end="1.5" xml:lang="es">
          <axisLine position="origin" positionticmark="5" legendWidth="77.7566666666667" xml:lang="es" />
          <axisGrid xml:lang="es">
            <gridFrequency xml:lang="es">7</gridFrequency>
            <gridLabels display="true" xml:lang="es" />
            <gridLines xml:lang="es" />
            <tickMarks display="true" xml:lang="es" />
          </axisGrid>
          <axisLabel xml:lang="es" />
          <markers xml:lang="es" />
          <numberFormat xml:lang="es">
            <general precision="3" show-trailing-zeros="false" radix="dec" zero-threshold="15" imaginary-value="i" exponential-threshold="3" xml:lang="es" />
          </numberFormat>
          <plotEquations xml:lang="es">
            <plotEquation xml:lang="es">
              <math resultRef="182" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">C</id>
                  <real xml:lang="es">1</real>
                </apply>
              </math>
              <math resultRef="183" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
            <plotEquation xml:lang="es">
              <math resultRef="184" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">C</id>
                  <real xml:lang="es">2</real>
                </apply>
              </math>
              <math resultRef="185" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
          </plotEquations>
          <xyDomain scale-type="linear" auto-scale="true" xml:lang="es">
            <startValue resultRef="177" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">-1.5</real>
            </startValue>
            <secondTickValue resultRef="179" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">-1.0</real>
            </secondTickValue>
            <endValue xml:lang="es" resultRef="181">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">1.5</real>
            </endValue>
          </xyDomain>
        </yAxis>
      </axes>
    </xyPlot>
  </plot>
</region>

• Ahora los datos están centrados alrededor del origen. Este es uno de los pasos que la función Nipals realiza automáticamente.

• En muchas aplicaciones de PCA, también es recomendable escalar los datos de modo que las variables tengan pesos iguales; por ejemplo, cuando variables diferentes tienen unidades diferentes. Es habitual escalar todas las variables (cada columna de datos) a varianza unitaria, pero ese escalado no es adecuado para estos datos, por lo que no se debe aplicar ninguno.

<!-- Math region ID0EZYOU: defines NIPALS_Result as the function Nipals applied to the
     argument sequence Data, NumPC, MaxIteration, the string "noscale", and Acc.
     The first argument is Data, not the matrix C defined in an earlier region.
     NumPC, MaxIteration and Acc are defined outside this fragment.
     NOTE(review): presumably number of components, iteration limit and accuracy tolerance;
     confirm against the Nipals function reference. -->
<region id="ID0EZYOU" top="1612.8000000000002" left="38.400000000000006" height="25.6" width="499.89333333333337" xml:lang="es" xmlns="http://schemas.mathsoft.com/worksheet50">
  <math resultRef="203" xml:lang="es">
    <define xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
      <id labels="*" xml:space="preserve" xml:lang="es">NIPALS_Result</id>
      <apply xml:lang="es">
        <id labels="FUNCTION" xml:space="preserve" xml:lang="es" label-is-contextual="true">Nipals</id>
        <sequence xml:lang="es">
          <id labels="VARIABLE" xml:space="preserve" xml:lang="es" label-is-contextual="true">Data</id>
          <id labels="VARIABLE" xml:space="preserve" xml:lang="es" label-is-contextual="true">NumPC</id>
          <id labels="VARIABLE" xml:space="preserve" xml:lang="es" label-is-contextual="true">MaxIteration</id>
          <str xml:space="preserve" xml:lang="es">noscale</str>
          <id labels="VARIABLE" xml:space="preserve" xml:lang="es" label-is-contextual="true">Acc</id>
        </sequence>
      </apply>
    </define>
    <!-- Result display settings: matrix format with show-indices and expand-nested-arrays both false. -->
    <resultFormat xml:lang="es">
      <matrix size="12,12" offset="0,0" show-indices="false" expand-nested-arrays="false" xml:lang="es" />
    </resultFormat>
  </math>
</region>

<!-- XY plot region ID0EOCPU.
     x-axis expression: matcol applied to SCORES and 0.
     y-axis expressions: matcol applied to SCORES and 1, and matcol applied to SCORES and 2.
     The plot sets origin-positioning="true" and both axisLine elements use position="origin".
     Two traces are declared, both with symbol "x" and line-style "None".
     SCORES is defined outside this fragment.
     NOTE(review): matcol is presumably the matrix-column operator, so this would plot
     columns 1 and 2 of SCORES against column 0; confirm against the Mathcad schema. -->
<region id="ID0EOCPU" top="2611.2000000000003" left="38.400000000000006" height="312" width="578" xml:lang="es" xmlns="http://schemas.mathsoft.com/worksheet50">
  <plot background-type="white" origin-positioning="true" xml:lang="es">
    <xyPlot xml:lang="es">
      <title class="- topic/title " xml:lang="es" toc="yes" wwtype:type="Paragraph" xmlns:wwtype="urn:WebWorks-Type-Schema" />
      <legend xml:lang="es" />
      <!-- Trace styling. The resultRef values point at results that are not visible in this fragment. -->
      <traces xml:lang="es">
        <trace resultRef="217" xml:lang="es">
          <traceStyle color="#FF00008B" symbol="x" line-weight="1" line-style="None" xml:lang="es">lines</traceStyle>
        </trace>
        <trace resultRef="218" xml:lang="es">
          <traceStyle color="#FFFF0000" symbol="x" line-weight="1" line-style="None" xml:lang="es">lines</traceStyle>
        </trace>
      </traces>
      <graph-size width="420.4" height="235.2" xml:lang="es" />
      <axes xml:lang="es">
        <!-- Horizontal axis: attributes give start="-2" and end="2", but the xyDomain below stores
             only empty placeholders (no resultRef, no numeric limits, no secondTickValue). -->
        <xAxis rank="1" legend-position="PlotBoundaryBottom" start="-2" end="2" xml:lang="es">
          <axisLine position="origin" positionticmark="5" legendWidth="130.073333333333" xml:lang="es" />
          <axisGrid xml:lang="es">
            <gridFrequency xml:lang="es">11</gridFrequency>
            <gridLabels display="true" xml:lang="es" />
            <gridLines xml:lang="es" />
            <tickMarks display="true" xml:lang="es" />
          </axisGrid>
          <axisLabel xml:lang="es" />
          <markers xml:lang="es" />
          <numberFormat xml:lang="es">
            <general precision="3" show-trailing-zeros="false" radix="dec" zero-threshold="15" imaginary-value="i" exponential-threshold="3" xml:lang="es" />
          </numberFormat>
          <!-- Each plotEquation holds two math elements: the axis expression and an empty placeholder. -->
          <plotEquations xml:lang="es">
            <plotEquation xml:lang="es">
              <math resultRef="219" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">SCORES</id>
                  <real xml:lang="es">0</real>
                </apply>
              </math>
              <math resultRef="220" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
          </plotEquations>
          <xyDomain scale-type="linear" auto-scale="true" xml:lang="es">
            <startValue xml:lang="es">
              <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
            </startValue>
            <endValue xml:lang="es">
              <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
            </endValue>
          </xyDomain>
        </xAxis>
        <!-- Vertical axis: linear scale with auto-scale="true".
             NOTE(review): the attribute end="0.6" differs from the stored endValue of 0.5 below;
             possibly an auto-scale artefact, confirm which one the renderer uses. -->
        <yAxis rank="1" legend-position="PlotBoundaryLeft" start="-0.5" end="0.6" xml:lang="es">
          <axisLine position="origin" positionticmark="5" legendWidth="130.073333333333" xml:lang="es" />
          <axisGrid xml:lang="es">
            <gridFrequency xml:lang="es">12</gridFrequency>
            <gridLabels display="true" xml:lang="es" />
            <gridLines xml:lang="es" />
            <tickMarks display="true" xml:lang="es" />
          </axisGrid>
          <axisLabel xml:lang="es" />
          <markers xml:lang="es" />
          <numberFormat xml:lang="es">
            <general precision="3" show-trailing-zeros="false" radix="dec" zero-threshold="15" imaginary-value="i" exponential-threshold="3" xml:lang="es" />
          </numberFormat>
          <plotEquations xml:lang="es">
            <plotEquation xml:lang="es">
              <math resultRef="227" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">SCORES</id>
                  <real xml:lang="es">1</real>
                </apply>
              </math>
              <math resultRef="228" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
            <plotEquation xml:lang="es">
              <math resultRef="229" xml:lang="es">
                <apply xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">
                  <matcol xml:lang="es" />
                  <id xml:space="preserve" xml:lang="es">SCORES</id>
                  <real xml:lang="es">2</real>
                </apply>
              </math>
              <math resultRef="230" xml:lang="es">
                <placeholder xml:lang="es" xmlns="http://schemas.mathsoft.com/math50" />
              </math>
            </plotEquation>
          </plotEquations>
          <xyDomain scale-type="linear" auto-scale="true" xml:lang="es">
            <startValue resultRef="222" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">-0.5</real>
            </startValue>
            <secondTickValue resultRef="224" xml:lang="es">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">-0.4</real>
            </secondTickValue>
            <endValue xml:lang="es" resultRef="226">
              <real xml:lang="es" xmlns="http://schemas.mathsoft.com/math50">0.5</real>
            </endValue>
          </xyDomain>
        </yAxis>
      </axes>
    </xyPlot>
  </plot>
</region>