Question

我已经生成了一个看起来像这样的文件（这里是一个摘录，大致上两个文件中的每一个都有一个共同的列1和2的名称乘以一个不同的参数，最合适的，即最低的chi2，是在第3列中返回第4和第5列中的适当参数：

10 05 0.42 0.13 0.01   
10 10 0.30 0.12 0.01  
10 15 0.25 0.11 0.07  
15 05 0.29 0.12 0.01  
15 10 0.25 0.11 0.06  
15 15 0.23 0.10 0.02  
20 05 0.25 0.11 0.03  
20 10 0.23 0.12 0.04  
20 15 0.23 0.13 0.05  
25 05 0.23 0.10 0.03  
25 10 0.23 0.10 0.08  
25 15 0.24 0.09 0.05

我正在开始/学习使用列表，因为我的代码实际上是使用for循环减慢（目前我正在使用4 for循环所以它太疯狂了），我不知道重写我的优化代码，所以它不需要8个小时才能工作。所以相反，为了重新组织输出，我想知道是否可以创建一个列表，如mytemplist，其内容如下：

> mytemplist  
$5 
[1] 10 15 20 25  
[2] 0.42 0.29 0.25 0.23  
[3] 0.13 0.12 0.11 0.10
[4] 0.01 0.01 0.03 0.03  

$10  
[1] 10 15 20 25  
[2] 0.30 0.25 0.23 0.23
[3] 0.12 0.11 0.12 0.10  
[4] 0.01 0.06 0.04 0.08  

$15  
[1] 10 15 20 25  
[2] 0.25 0.23 0.23 0.24  
[3] 0.11 0.10 0.13 0.09  
[4] 0.07 0.02 0.05 0.05

我查看了有关列表的问题，我只能通过在列表中创建列表来解决这个问题，而这些列表在这里没有帮助。

编辑：
接受的答案回复上面的具体问题，回答@rawr帖子我加入文件是如何生成的（它不漂亮，我没有使用opt，因为我将进化代码以优化数据点的更大自由度）：
注意：要读取的典型文件是2列文件（只是数字列表），并命名为a10b05s和a10b05t
dataname也是一个2列的文件
在这3个文件中，第一列是相同的并代表枢轴
需要找到par [1]和par [2]，使par [1] * a10b05s + par [2] * a10b05t最适合数据

par <- rep(NA, 2)
pivot <- read.table(dataname)[[1]]
data2fit <- read.table(dataname)[[2]]

for (i in 1:10){
    vala <- 10+5*(i-1)
    namei <- paste("a", vala, sep="")

    for (j in 1:10){
        #creates a coordinates for storage
        cglobal <- (i-1) * 10 + j           

        valb <- 5+5*(j-1)
        namej1 <- paste(namei, "b", valb, "s", sep="")
        namej2 <- paste(namei, "b", valb, "t", sep="")
        infile1 <- read.table(namej1)
        infile2 <- read.table(namej2)

        # infile1 prominent wrt infile2 so first quick determination of par1 
        tempspace1 <- seq(0.001, 0.009, 0.001)
        par1_s1 <- c(tempspace1, tempspace1*10, tempspace1*100) 
        opt1_par1 <- rep(NA, length(par1))

        # set a pivot for comparison at position named temppivot find par1 wrt temppivot
        for(k in 1:length(par1){
            opt1_par1[k] <- abs(par1_s1[k]*infile1[[1]][temppivot] - data2fit[temppivot])
        }

        par[1] <- par1_s1[match(min(opt1_par1)), opt1_par1]

        # set a space for a finer fit for par[1]
        par1_s2 <- seq(par[1]-5*par[1]/10, par[1]+5*par[1]/10, par[1]/100)

        # set a space to fit par[2] note that there is an option in the code to choose btw 0.001-0.01, 0.01-0.1 etc.
        tempspace2 <- seq(0.001, 0.009, 0.0001)
        par2 <- c(tempspace2, tempspace2*10, tempspace2*100)
        chi2 <- rep(NA, length(par1_s2)*length(par2))
        #data2fit 

        for(z in 1:length(par1_s2)){
            for(w in 1:length(par2)){
                par[1] <- par1_s2[z]
                par[2] <- par2[w]
                thesum <- rep(NA, length(pivot))
                    for(h in 1:length(pivot)){
                        c1 <- pivot[h]
                        thesum[h] <- par[1] * infile[[1]][c1] + par[2] * infile2[[1]][c1]
                    }
            c2 <- (z-1) * length(par2) + w
            chi2[c2] <- sum((thesum-data2fit)^2/thesum)
            }
        }

        whichbestfit <- match(min(chi2), chi2)
        chi2min <- min(chi2)

        localparfinder <- function(x){
            temp1 <- trunc(x/length(par2)) + 1
            temp2 <- x - (temp1 -1) * length(par2)
            y <- c(par1_s2[temp1], par2[temp2])
            }

        par <- localparfinder(whichbestfit)

        # creates the table of the original post
        storage[cglobal,] <- c(vala, valb, chi2min, par[1], par[2])
    }
}


write.table(storage, file=paste("storage_", format(Sys.time(), "%d%b_%H%M"), ".dat", sep="")

Answer 1

您可以使用by和t ranspose，如下所示：

by(mydf[-2], mydf[[2]], t)
# mydf[[2]]: 5
#        1     4     7    10
# V1 10.00 15.00 20.00 25.00
# V3  0.42  0.29  0.25  0.23
# V4  0.13  0.12  0.11  0.10
# V5  0.01  0.01  0.03  0.03
# ----------------------------------------------------------- 
# mydf[[2]]: 10
#        2     5     8    11
# V1 10.00 15.00 20.00 25.00
# V3  0.30  0.25  0.23  0.23
# V4  0.12  0.11  0.12  0.10
# V5  0.01  0.06  0.04  0.08
# ----------------------------------------------------------- 
# mydf[[2]]: 15
#        3     6     9    12
# V1 10.00 15.00 20.00 25.00
# V3  0.25  0.23  0.23  0.24
# V4  0.11  0.10  0.13  0.09
# V5  0.07  0.02  0.05  0.05

以上结果是list，其类别为by。如果您对其使用了unclass，则会与split + lapply方法类似。

Answer 2

这是一种可能性：

lst <- split(df[-2], df$V2)   # split according to colum 2 and drop column 2 in the output

lst <- lapply(lst, t)         # transpose each list element
lst
#   $`5`
#       1     4     7    10
#V1 10.00 15.00 20.00 25.00
#V3  0.42  0.29  0.25  0.23
#V4  0.13  0.12  0.11  0.10
#V5  0.01  0.01  0.03  0.03
#
#$`10`
#       2     5     8    11
#V1 10.00 15.00 20.00 25.00
#V3  0.30  0.25  0.23  0.23
#V4  0.12  0.11  0.12  0.10
#V5  0.01  0.06  0.04  0.08
#
#$`15`
#       3     6     9    12
#V1 10.00 15.00 20.00 25.00
#V3  0.25  0.23  0.23  0.24
#V4  0.11  0.10  0.13  0.09
#V5  0.07  0.02  0.05  0.05

如果你喜欢它更紧凑，你也可以像这样嵌套分裂和lapply：

lst <- lapply(split(df[-2], df$V2), t)

如何在列表的元素中存储多个向量？

2 个答案: