我有一个个体数据集,这些个体来自四个种群、四种处理(底物)和三个重复。每个个体只属于一个种群、底物和重复的组合。我对每个个体测量了四项指标。我想针对每个种群、底物和重复的组合,对这些测量值进行 PCA。
我知道如何对所有个体一起进行 PCA;我也可以按种群、底物和重复的每种组合把数据集拆分成多个子数据集,然后对每个子数据集分别执行 PCA。
我如何才能直接在完整的数据集上进行 PCA,以最有效的方式得到每个种群、底物和重复组合的 PC1、PC2... 结果?我想过把数据集转换为列表,但不确定如何将 princomp 函数应用于列表。我的思路对吗?
样本数据:
# Example data frame: 48 rows, one per Location x Substrate x Replicate
# combination (4 locations x 4 substrates x 3 replicates), plus four
# measurement columns. Built as a bare list with the data.frame class and
# compact row names attached, so character columns stay character.
TestData <- structure(
  list(
    # Each location label fills a contiguous run of 12 rows.
    Location = rep(c("A", "B", "C", "D"), each = 12L),
    # Substrates cycle A, B, C, D down the rows.
    Substrate = rep(c("A", "B", "C", "D"), times = 12L),
    # Within every location: replicate 1 (4 rows), 2 (4 rows), 3 (4 rows).
    Replicate = rep(1:3, each = 4L, times = 4L),
    # Measurement vectors below are laid out one line per location.
    Weight = c(
      0.0092, 0.0083, 0.0088, 0.0077, 0.0088, 0.01, 0.0099, 0.011, 0.0078, 0.0086, 0.0071, 0.0093,
      0.0111, 0.01, 0.0097, 0.0091, 0.0083, 0.0098, 0.0093, 0.009, 0.0114, 0.0087, 0.0094, 0.0096,
      0.0099, 0.0105, 0.0091, 0.0115, 0.0106, 0.0104, 0.0113, 0.0115, 0.0107, 0.0126, 0.0106, 0.0101,
      0.0095, 0.0113, 0.0111, 0.0118, 0.0114, 0.0123, 0.0119, 0.0103, 0.0119, 0.0116, 0.0112, 0.0114
    ),
    Thorax_Width = c(
      1.31, 1.31, 1.43, 1.45, 1.52, 1.43, 1.57, 1.45, 1.43, 1.54, 1.32, 1.49,
      1.58, 1.36, 1.42, 1.45, 1.48, 1.38, 1.55, 1.46, 1.52, 1.42, 1.6, 1.49,
      1.48, 1.58, 1.51, 1.53, 1.54, 1.76, 1.63, 1.62, 1.44, 1.51, 1.53, 1.58,
      1.46, 1.94, 1.54, 2.09, 1.5, 1.65, 1.86, 1.54, 1.8, 1.98, 1.82, 1.63
    ),
    Wing_Length = c(
      1359L, 1377L, 1555L, 1559L, 1562L, 1578L, 1580L, 1588L, 1597L, 1598L, 1603L, 1605L,
      1612L, 1614L, 1616L, 1617L, 1623L, 1628L, 1639L, 1642L, 1643L, 1649L, 1651L, 1652L,
      1653L, 1653L, 1654L, 1656L, 1656L, 1656L, 1662L, 1664L, 1665L, 1668L, 1670L, 1670L,
      1671L, 1672L, 1674L, 1682L, 1685L, 1687L, 1688L, 1694L, 1698L, 1698L, 1707L, 1708L
    ),
    Leg_Length = c(
      414L, 390L, 627L, 541L, 430L, 450L, 451L, 462L, 443L, 582L, 435L, 579L,
      499L, 418L, 444L, 646L, 589L, 466L, 435L, 477L, 450L, 606L, 660L, 450L,
      446L, 480L, 462L, 438L, 483L, 454L, 492L, 457L, 463L, 499L, 470L, 474L,
      627L, 478L, 473L, 496L, 666L, 499L, 480L, 461L, 450L, 483L, 460L, 584L
    )
  ),
  row.names = c(NA, 48L),
  class = "data.frame"
)