将 nls 拟合到分组数据 R

Question

我正在尝试将非线性模型拟合到整个季节中在多个地块上收集的一系列测量值。下面是来自较大数据集的子样本。数据：

dput(nee.example) structure(list(julian = c(159L, 159L, 159L, 159L, 159L, 159L, 159L, 159L, 159L, 159L, 159L, 159L, 159L, 159L, 169L, 169L, 169L, 169L, 169L, 169L, 169L, 169L, 169L, 169L, 169L, 169L, 169L, 169L, 169L), blk = structure(c(1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L), .Label = c("e", "w"), class = "factor"), type = structure(c(1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L), .Label = c("b", "g"), class = "factor"), plot = c(1L, 1L, 1L, 1L, 2L, 2L, 2L, 2L, 2L, 3L, 3L, 3L, 3L, 3L, 1L, 1L, 1L, 1L, 2L, 2L, 2L, 2L, 2L, 3L, 3L, 3L, 3L, 3L, 3L), trt = structure(c(1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = "a", class = "factor"), cloth = c(25L, 50L, 75L, 100L, 0L, 25L, 50L, 75L, 100L, 0L, 25L, 50L, 75L, 100L, 0L, 25L, 50L, 100L, 0L, 25L, 50L, 75L, 100L, 0L, 25L, 50L, 75L, 75L, 100L), plotID = c(1L, 1L, 1L, 1L, 2L, 2L, 2L, 2L, 2L, 3L, 3L, 3L, 3L, 3L, 13L, 13L, 13L, 13L, 14L, 14L, 14L, 14L, 14L, 15L, 15L, 15L, 15L, 15L, 15L ), flux = c(0.76, 0.6, 0.67, 0.7, 1.72, 1.63, -7.8, 0.89, 0.51, 0.76, 0.48, 0.62, 0.18, 0.21, 3.87, 2.44, 1.26, -1.39, 2.18, 1.9, 0.81, -0.04, -0.83, 1.99, 1.55, 0.57, -0.02, -0.16, -2.12), ChT = c(18.6, 19.1, 19.6, 19.1, 16.5, 17.3, 18.3, 19, 18.6, 17.2, 18.4, 19, 19.2, 20.6, 22, 21.9, 22.4, 23.8, 20.7, 21.5, 22.5, 23.3, 23.8, 20.1, 20.8, 21.2, 21.8, 21.8, 21.4), par = c(129.9, 210.2, 305.4, 796.6, 1.3, 62.7, 149.9, 171.2, 453.3, 1.3, 129.7, 409.3, 610, 1148.6, 1.3, 115.2, 237, 814.6, 1.3, 105.4, 293.4, 472.1, 955.9, 1.3, 100.5, 290, 467, 413.6, 934.2)), .Names = c("julian", "blk", "type", "plot", "trt", "cloth", "plotID", "flux", "ChT", "par"), class = "data.frame", row.names = c(NA, -29L))

我需要将以下模型（rec.hyp，如下）拟合到每个日期的每个地块，并检索每个 julian-plotID 组合的参数估计值。经过一番探索之后，听起来 nlsList 是一个理想的函数，因为它具有分组方面的特点：

library(nlme)
rec.hyp <- nlsList(flux ~ Re - ((Amax*par)/(k+par)) | julian/plotID,
             data=nee.example,
             start=c(Re=3, k=300, Amax=5),
             na.action=na.omit)
coef(rec.hyp)

但是我不断收到相同的错误消息：

Error in nls(formula = formula, data = data, start = start, control = control) : 
step factor 0.000488281 reduced below 'minFactor' of 0.000976562

我尝试调整 nls.control 中的控件以增加 maxIter 和 tol，但显示相同的错误消息。而且我已经改变了初始起始值无济于事。

需要注意的是，为了与之前的工作保持一致，我需要使用最小二乘法来拟合模型。

问题：

nlsList 是否允许我的分组结构。换句话说，我可以在 julian 中嵌套 plotID 吗？这可能是我错误的根源吗？
我读到不适当的起始参数估计会导致错误消息，但在更改它们后我得到了相同的消息。

我觉得我在这里遗漏了一些简单的东西，但我的大脑被炸了。

提前致谢。

Answer 1

问题 1 的回答：您的分组结构是正确的。您可以通过运行 nls 对您的数据子集进行验证：

rec.hyp.test <- nls(flux ~ Re - ((Amax*par)/(k+par)),
                   data=subset(nee.example,julian==159 & plotID==3),
                   start=c(Re=3, k=300, Amax=5),
                   na.action=na.omit)
coef(rec.hyp.test)
#        Re           k        Amax 
# 0.7208943 792.4412287   0.8972519 

coef(rec.hyp)[3,]
#              Re        k      Amax
# 159/3 0.7208943 792.4412 0.8972519

问题 2 的回答：某些数据集无法通过给定模型正确拟合。根据 flux ~ Re - ((Amax*par)/(k+par)) 公式，人们可能期望 flux 随 par 单调递减（或递增，如果 Amax < 0）。出于好奇，我绘制了导致 nls 失败的数据集之一：

plot(flux~par,subset(nee.example,julian==159 & plotID==1))

发现一点都不单调，甚至可以说一点趋势都没有！我想即使你强迫 nls 为这种情况找到一些解决方案，它也很可能是虚假的，所以你可能只想让它不适合（即 NA）。

我还建议对输入数据和拟合模型质量进行目视检查。使用 R 和 reshape2 和 ggplot2 等包，您可以轻松绘制数百个，甚至快速浏览一下也能帮助您远离麻烦。

将 nls 拟合到分组数据 R

Fitting nls to grouped data R

r

nls