Fitting cell growth model (Monod) with 3 PDEs in R

Question

Hi everybody, I'm trying to fit the experimental data on a set of 3 PDEs to find 4 coefficients including mumax, Ks, Y_(x/s), and Y_(p/s). The code I used worked with the set of 2 PDEs but is not working with this set of 3. The following is the code:

The set of PDEs needs to be fitted:

dX/dt = mumax. S. X / (Ks + S)

dS/dt = -1/Y_(x/s). mumax. S. X / (Ks + S)

dP/dt = 1/Y_(p/s). mumax. S. X / (Ks + S)

library(deSolve)
library(ggplot2) 
library(minpack.lm) # library for least squares fit using levenberg-marquart algorithm
library(reshape2)

t = c(0, 3, 5, 8, 9.5, 11.5, 14, 16, 18, 20, 25, 27)
x = c(0.0904, 0.1503, 0.2407, 0.3864, 0.5201, 0.6667, 0.8159, 0.9979, 1.0673, 1.1224, 1.1512, 1.2093)
s = c(9.0115, 8.8088, 7.9229, 7.2668, 5.3347, 4.911, 3.5354, 1.4041, 0, 0, 0, 0)
p = c(0.0151, 0.0328, 0.0621, 0.1259, 0.2949, 0.3715, 0.4199, 0.522, 0.5345, 0.6081, 0.07662, 0.7869)
data2 <- data.frame(t,x,s,p)

data2.1=melt(data2,id.vars=c("t"),variable.name="Substance",value.name="Concentration")
ggplot(data=data2.1,aes(x=t,y=Concentration,color=Substance))+geom_point(size=3)

Monod2 <- function(t,c,parms) {
  
  k1 <- parms$k1 # mumax
  k2 <- parms$k2 # Ks
  k3 <- parms$k3 # Y_(X/S)
  k4 <- parms$k4 # alpha
  k5 <- parms$k4 # beta
  
  r=rep(0,length(c)) # c is the concentration either X or S 
  
  r[1] <-  k1 * c["S"] * c["X"] / ( k2 + c["S"] ) # r[1] = dCx/dt = k1.Cs.Cx/(k2+Cs)
  
  r[2] <- -k1 * c["S"] * c["X"] / ( ( k2 + c["S"] ) * k3 ) # r[2] = dCs/dt = -1/k3 * dCx/dt 
  
  r[3] <-  k4 * r[1] + k5 * c["X"] # r[3] = dCp/dt = alpha * dX/dt + beta * X
  
  return(list(r))       
  
}

cinit=c(data2[1,2], data2[1,3], data2[1,4])
t=data2$t
parms=list(k1=0.1, k2=5, k3=1, k4=0.08, k5 = 0.005)
out=ode(y=cinit, 
        times=t,
        func=Monod2,
        parms=parms
)
head(out)

ssq = function(parms){
  
  # inital concentration:
  cinit = c( x=data2[1,2], s=data2[1,3], p=data2[1,4] )
  
  # time points for which conc is reported including the points where data is available:
  t = c(seq(0, 27, 1), data2$t)
  t = sort(unique(t))
  
  # parameters from the parameter estimation routine:
  k1 = parms[1]
  k2 = parms[2]
  k3 = parms[3]
  k4 = parms[4]
  
  # solve ODE for a given set of parameters:
  out = ode( y = cinit, times = t, func = Monod2, parms = list( k1 = k1, k2 = k2, k3 = k3, k4 = k4) )
  
  # Filter data that contains time points where data is available:
  out_Monod2 = data.frame(out)
  out_Monod2 = out_Monod2[out_Monod2$t %in% data2$t,]
  
  # Evaluate predicted vs experimental residual:
  pred_Monod2 = melt(out_Monod2,id.var="t",variable.name="Substance",value.name="Concentration")
  exp_Monod2 = melt(data2,id.var="t",variable.name="Substance",value.name="Concentration")
  ssqres=pred_Monod2$conc-exp_Monod2$conc
  
  # return predicted vs experimental residual
  return(ssqres)
  
}

# initial guess for parameters: 
parms=c(k1=0.5, k2=6.5, k3=0.2, k4=1.2)
# fitting
fitval=nls.lm(par=parms,fn=ssq)
summary(fitval)

I got the error as the following

Error: id variables not found in data: t

This code works with a set of 2 PDEs

# Data: 
time = c(10, 18, 25, 33, 37, 40, 44)
X    = c(1.5, 2.9, 5.5, 11.4, 16.3, 19.2, 20.9)
S    = c(48.5, 45.2, 38.8, 24.0, 11.8, 4.5, 0.3)
monod = data.frame(time,X,S)
monod

# Define the PDEs:
Monod <- function(t,c,parms) {
  
  k1 <- parms$k1
  k2 <- parms$k2
  k3 <- parms$k3
  
  r=rep(0,length(c)) # c is the concentration either X or S 
  
  r[1] <-  k1 * c["S"] * c["X"] / ( k2 + c["S"] ) # r[1] = dCx/dt = k1.Cs.Cx/(k2+Cs)
  
  r[2] <- -k1 * c["S"] * c["X"] / ( ( k2 + c["S"] ) * k3 ) # r[2] = dCs/dt = -1/k3 * dCx/dt 
  
  return(list(r))       
  
  
}

# Boundary and Initial conditions and ODE solver 
cinit=c(X=1.5, S = 48.5)

t=monod$time

parms=list(k1=0.09742736, k2=3.762556, k3=0.4036112)

out=ode(y=cinit, 
        times=t,
        func=Monod,
        parms=parms
)

head(out)

# Calculate sum of squares of residuals: 
ssq = function(parms){
  
  # inital concentration:
  cinit = c( X = 1.5, S = 48.5 )
  
  # time points for which conc is reported including the points where data is available:
  t = c(seq(10, 44, 2), monod$time)
  t = sort(unique(t))
  
  # parameters from the parameter estimation routine:
  k1 = parms[1]
  k2 = parms[2]
  k3 = parms[3]
  
  # solve ODE for a given set of parameters:
  out = ode( y = cinit, times = t, func = Monod, parms = list( k1 = k1, k2 = k2, k3 = k3) )
  
  # Filter data that contains time points where data is available:
  out_Monod = data.frame(out)
  out_Monod = out_Monod[out_Monod$time %in% monod$time,]
  
  # Evaluate predicted vs experimental residual:
  pred_Monod = melt(out_Monod,id.var="time",variable.name="species",value.name="conc")
  exp_Monod = melt(monod,id.var="time",variable.name="species",value.name="conc")
  ssqres=pred_Monod$conc-exp_Monod$conc
  
  # return predicted vs experimental residual
  return(ssqres)
  
}
# The parameter fitting is done using Levenberg-Marquardt routine in package minpack.lm.
# initial guess for parameters: 
parms=c(k1=0.1,k2=5,k3=1)
# fitting
fitval=nls.lm(par=parms,fn=ssq)
summary(fitval)

# Estimated parameters:
parest=as.list(coef(fitval))
parest

## plotting the data and the fitting curves:
# plot of predicted vs experimental data
# simulated predicted profile at estimated parameter values
cinit=c(X=1.5,S=48.5)
t=seq(10,44,2)
parms=as.list(parest)
out=ode(y=cinit,times=t,func=Monod,parms=parms)
out_Monod=data.frame(out)
names(out_Monod)=c("time","X_pred","S_pred")

# Overlay predicted profile with experimental data
tmppred=melt(out_Monod,id.var=c("time"),variable.name="Substance",value.name="Concentration")
tmpexp=melt(monod,id.var=c("time"),variable.name="Substance",value.name="Concentration")
p=ggplot(data=tmppred,aes(x=time,y=Concentration,color=Substance,linetype=Substance))+geom_line()
p=p+geom_line(data=tmpexp,aes(x=time,y=Concentration,color=Substance,linetype=Substance))
p=p+geom_point(data=tmpexp,aes(x=time,y=Concentration,color=Substance))
p=p+scale_linetype_manual(values=c(0,1,0,1,0,1))
p=p+scale_color_manual(values=rep(c("red","blue"),each=2))+theme_bw()
print(p)

Answer 1

The original code had several issues:

the state variables were lower case in the data, upper case in the model and without any name in the initial values
time was called t in the data and time in the ode output
concentration had the name Concentration in one place and conc in another
The names ssq and ssqres were misleading as the function calculates the residuals and not the square and not a sum. The sum of squares is calculated in the background (see ?nls.lm )
the assignment operators <- and = were inconsistently used. This is not an error, but not really good style.
instead of artificial names k1, K2, ... one can directly use original names like mumax or alpha .
It is not clear why names like data2 or Monod2 were used as there was no data1 .

Fixing all this, we come to the solution below. It runs through and fits somehow, but it can still be improved. The warnings may be ignored for now. The reason is, that parameters exceed the allowed range. This can of course be fixed but would be another question.

library(deSolve)
library(ggplot2) 
library(minpack.lm)
library(reshape2)

data <- data.frame(
  time = c(0, 3, 5, 8, 9.5, 11.5, 14, 16, 18, 20, 25, 27),
  X = c(0.0904, 0.1503, 0.2407, 0.3864, 0.5201, 0.6667, 0.8159, 0.9979, 1.0673, 1.1224, 1.1512, 1.2093),
  S = c(9.0115, 8.8088, 7.9229, 7.2668, 5.3347, 4.911, 3.5354, 1.4041, 0, 0, 0, 0),
  P = c(0.0151, 0.0328, 0.0621, 0.1259, 0.2949, 0.3715, 0.4199, 0.522, 0.5345, 0.6081, 0.07662, 0.7869)
)

Monod <- function(t, c, parms) {
  k1 <- parms$k1 # mumax
  k2 <- parms$k2 # Ks
  k3 <- parms$k3 # Y_(X/S)
  k4 <- parms$k4 # alpha
  k5 <- parms$k4 # beta
  r <- numeric(length(c))
  r[1] <-  k1 * c["S"] * c["X"] / (k2 + c["S"])
  r[2] <- -k1 * c["S"] * c["X"] / ((k2 + c["S"]) * k3)
  r[3] <-  k4 * r[1] + k5 * c["X"]
  return(list(r))       
}

cinit <- c(X = data[1, 2], S = data[1, 3], P = data[1, 4])
t <- data$time
parms <- list(k1=0.1, k2=5, k3=1, k4=0.08, k5 = 0.005)

out <- ode(y=cinit, times=t, func = Monod, parms=parms)
plot(out)

residuals <- function(parms){
  cinit <- c(X = data[1, 2], S = data[1, 3], P = data[1, 4] )
  
  # time points for which conc is reported including the points where data is available
  t <- c(seq(0, 27, 1), data$t)
  t <- sort(unique(t))
  
  # parameters from the parameter estimation routine:
  k1 <- parms[1]
  k2 <- parms[2]
  k3 <- parms[3]
  k4 <- parms[4]
  
  # solve ODE for a given set of parameters
  out <- ode(y = cinit, times = t, func = Monod, parms = list( k1 = k1, k2 = k2, k3 = k3, k4 = k4) )
  
  # Filter data that contains time points where data is available:
  out_Monod <- data.frame(out)
  out_Monod <- out_Monod[out_Monod$t %in% data$t,]
  
  # Evaluate predicted vs experimental residual
  pred_Monod <- melt(out_Monod, id.var="time", variable.name="Substance", value.name="conc")
  exp_Monod  <- melt(data, id.var="time", variable.name="Substance", value.name="conc")
  residuals  <- pred_Monod$conc - exp_Monod$conc
  
  # return predicted vs experimental residual
  return(residuals)
}

# initial guess for parameters
parms <- c(k1=0.5, k2=6.5, k3=0.2, k4=1.2)
fitval <- nls.lm(par=parms, fn=residuals)
summary(fitval)

out <- ode(y=cinit, times=seq(min(data$time), max(data$time)), func = Monod, parms=as.list(coef(fitval)))
plot(out, obs=data, mfrow=c(1, 3))

拟合模型

Fitting cell growth model (Monod) with 3 PDEs in R

Question

1 answers

solution1
0 2022-07-31 10:01:40

Fitting cell growth model (Monod) with 3 PDEs in R

Question

1 answers

solution1 0 2022-07-31 10:01:40

solution1
0 2022-07-31 10:01:40