Added fitted and residuals methods for cpt, cpt.reg, cpt.range classes.

rkillick · Oct 14, 2024 · fc13ed1 · fc13ed1
1 parent 5f95436
commit fc13ed1
Show file tree

Hide file tree

Showing 8 changed files with 213 additions and 70 deletions.
diff --git a/DESCRIPTION b/DESCRIPTION
@@ -29,4 +29,3 @@ Author: Rebecca Killick [aut, cre],
   Paul Fearnhead [ctb, ths],
   Robin Long [ctb],
   Jamie Lee [ctr]
-RoxygenNote: 7.3.2
diff --git a/NAMESPACE b/NAMESPACE
@@ -6,7 +6,7 @@ import(stats)
 export("cpt.mean", "cpt.meanvar", "cpt.var","cpt.reg")
 export("BINSEG", "decision", "penalty_decision","PELT","class_input")
 exportClasses(cpt,cpt.reg,cpt.range)
-exportMethods(plot,summary,show,nseg,logLik,likelihood,data.set,data.set.ts,cpts,cpts.full, cpts.ts,cpttype,distribution,test.stat,
+exportMethods(plot,summary,show,nseg,logLik,likelihood,fitted,residuals,data.set,data.set.ts,cpts,cpts.full, cpts.ts,cpttype,distribution,test.stat,
 	method,ncpts,ncpts.max,param.est,param, coef,pen.type,pen.value,pen.value.full, minseglen, seg.len,"cpts<-","cpttype<-","data.set<-","distribution<-","test.stat<-","ncpts.max<-","param.est<-","pen.type<-",
 	"pen.value<-", "method<-", "cpts.full<-", "minseglen<-","pen.value.full<-")
 

diff --git a/NEWS b/NEWS
@@ -7,6 +7,7 @@ Version 2.3
 * Repeated code to calculate the cpts from a ncpts argument in cpt.range methods was removed.
 * The diagnostic plot for cpt.range objects (plot(object,diagnostic=TRUE)) has been changed to be more informative.  The axes have been swapped and instead of a line graph, a stepped graph is used which better reflects that you can't get fractional numbers of changepoints (type="s").  This can be overridden with another type if preferred.  Reworded the man file for plot-methods to reflect this change.
 * Added the upper bound on the tested penalty values to the pen.value.full slot for CROPS output.  Previously this was automatically removed and so you needed the original function call to know the upper bound that was tested.
+* Added fitted and residuals methods for cpt, cpt.reg, cpt.range classes.
 
 Version 2.2.5
 =============

diff --git a/R/cpt.class.R b/R/cpt.class.R
@@ -544,10 +544,9 @@ setClass("cpt",slots=list(data.set="ts", cpttype="character", method="character"
 	    param.est(object)=param.est
 	    return(object)
 	  }
-	  out=new('cpt.range')
-	  param.est(out)=param.est
-	  cpts(out)=cpts[-1] # keeps the n, not the 0
-	  return(out)
+	  param.est(object)=param.est
+	  cpts(object)=cpts[-1] # keeps the n, not the 0
+	  return(object)
 	})
 
 	setMethod("param", "cpt.reg", function(object,shape,...) {
@@ -560,6 +559,132 @@ setClass("cpt",slots=list(data.set="ts", cpttype="character", method="character"
 		return(object)
 	})
 
+
+# fitted functions
+  setMethod("fitted","cpt",function(object){
+    if(length(param.est(object))==0){# i.e. parameter.estimates=FALSE in call
+      cat('Calculating parameter estimates...')
+      object=param(object)
+      cat('done.\n')
+    }
+    if(cpttype(object)=="variance"){
+      means=param.est(object)$mean # fitting a constant to the data with changing mean
+      fitted=rep(means,length(data.set(object)))
+    }
+    else if(cpttype(object)=="mean"  ||  cpttype(object)=="mean and variance"){
+      #nseg=length(cpts(object))+1
+      cpts=c(0,object@cpts)
+      if((test.stat(object)=="Normal")||(test.stat(object)=="CUSUM")){
+        means=param.est(object)$mean
+      }
+      else if(test.stat(object)=="Gamma"){
+        means=param.est(object)$scale*param.est(object)$shape
+      }
+      else if(test.stat(object)=="Eobjectponential"){
+        means=1/param.est(object)$rate
+      }
+      else if(test.stat(object)=="Poisson"){
+        means=param.est(object)$lambda
+      }
+      else{
+        stop('Invalid Changepoint test statistic')
+      }
+      fitted=rep(means,seg.len(object))
+    }
+    else if(cpttype(object)=="trend"){
+      cpts=c(0,object@cpts)
+      intercept=rep(param.est(object)$thetaS,object@cpts-c(0,cpts(object)))
+      slope=rep(param.est(object)$thetaT-param.est(object)$thetaS,object@cpts-c(0,cpts(object)))/rep(object@cpts-c(0,cpts(object)),object@cpts-c(0,cpts(object)))
+      cptn=rep(c(0,cpts(object)),object@cpts-c(0,cpts(object)))
+      n=length(data.set(object))
+      fitted=intercept+slope*((1:n)-cptn)
+    }
+    else{
+      stop('Invalid Changepoint Type for fitted.\n Can only return fitted values for mean, variance, mean and variance')
+    }
+    return(fitted)
+  })
+
+	setMethod("fitted","cpt.range",function(object,ncpts=NA){
+	  if(is.na(ncpts)){
+	    if(length(param.est(object))==0){# i.e. parameter.estimates=FALSE in call
+	      cat('Calculating parameter estimates...')
+	      object=param(object)
+	      cat('done.\n')
+	    }
+	    cpts=c(0,object@cpts)
+	  }
+	  else{
+	    cpts=c(0,cpts(object,ncpts=ncpts),length(data.set(object)))
+	    object=param(object,ncpts=ncpts)
+	  }
+	  if(cpttype(object)=="variance"){
+	    means=param.est(object)$mean # fitting a constant to the data with changing mean
+	    fitted=rep(means,length(data.set(object)))
+	  }
+	  else if(cpttype(object)=="mean"  ||  cpttype(object)=="mean and variance"){
+	    #nseg=length(cpts(object))+1
+	    if((test.stat(object)=="Normal")||(test.stat(object)=="CUSUM")){
+	      means=param.est(object)$mean
+	    }
+	    else if(test.stat(object)=="Gamma"){
+	      means=param.est(object)$scale*param.est(object)$shape
+	    }
+	    else if(test.stat(object)=="Eobjectponential"){
+	      means=1/param.est(object)$rate
+	    }
+	    else if(test.stat(object)=="Poisson"){
+	      means=param.est(object)$lambda
+	    }
+	    else{
+	      stop('Invalid Changepoint test statistic')
+	    }
+	    fitted=rep(means,seg.len(object))
+	  }
+	  else if(cpttype(object)=="trend"){
+	    intercept=rep(param.est(object)$thetaS,object@cpts-c(0,cpts(object)))
+	    slope=rep(param.est(object)$thetaT-param.est(object)$thetaS,object@cpts-c(0,cpts(object)))/rep(object@cpts-c(0,cpts(object)),object@cpts-c(0,cpts(object)))
+	    cptn=rep(c(0,cpts(object)),object@cpts-c(0,cpts(object)))
+	    n=length(data.set(object))
+	    fitted=intercept+slope*((1:n)-cptn)
+	  }
+	  else{
+	    stop('Invalid Changepoint Type for fitted.\n Can only return fitted values for mean, variance, mean and variance')
+	  }
+	  return(fitted)
+	})
+
+	setMethod("fitted","cpt.reg",function(object){
+	  if(length(param.est(object))==0){# i.e. parameter.estimates=FALSE in call
+	    cat('Calculating parameter estimates...')
+	    object=param(object)
+	    cat('done.\n')
+	  }
+	  cpts=c(0,object@cpts)
+	  betas=param.est(object)$beta
+	  fitted=NULL
+	  for(i in 1:nseg(object)){
+	    fitted=c(fitted,betas[i,]%*%t(data.set(object)[(cpts[i]+1):cpts[i+1],-1]))
+	  }
+	  return(fitted)
+	})
+
+
+
+# residuals functions
+	setMethod("residuals","cpt",function(object){
+	  return(data.set(object)-fitted(object))
+	})
+	setMethod("residuals","cpt.reg",function(object){
+	  return(data.set(object)-fitted(object))
+	})
+	setMethod("residuals","cpt.range",function(object,ncpts=NA){
+	  return(data.set(object)-fitted(object,ncpts))
+	})
+
+
+
+
 # summary functions
 	setMethod("summary","cpt",function(object){
 	    cat("Created Using changepoint version",object@version,'\n')
@@ -618,51 +743,32 @@ setClass("cpt",slots=list(data.set="ts", cpttype="character", method="character"
 
 # plot functions
 	setMethod("plot","cpt",function(x,cpt.col='red',cpt.width=1,cpt.style=1,...){
+	  returnwhendone=FALSE
 	  if(length(param.est(x))==0){# i.e. parameter.estimates=FALSE in call
 	    cat('Calculating parameter estimates...')
-	    object=param(x)
+	    x=param(x)
 	    cat('done.\n')
+	    returnwhendone=TRUE
 	  }
 		plot(data.set.ts(x),...)
 		if(cpttype(x)=="variance" || cpttype(x)=="nonparametric (empirical_distribution)"){
 		  abline(v=index(data.set.ts(x))[cpts(x)],col=cpt.col,lwd=cpt.width,lty=cpt.style)
 		}
 		else if(cpttype(x)=="mean"  ||  cpttype(x)=="mean and variance"){
-			#nseg=length(cpts(x))+1
-			cpts=c(0,x@cpts)
-			if((test.stat(x)=="Normal")||(test.stat(x)=="CUSUM")){
-				means=param.est(x)$mean
-			}
-			else if(test.stat(x)=="Gamma"){
-				means=param.est(x)$scale*param.est(x)$shape
-			}
-			else if(test.stat(x)=="Exponential"){
-				means=1/param.est(x)$rate
-			}
-			else if(test.stat(x)=="Poisson"){
-			  means=param.est(x)$lambda
-			}
-			else{
-				stop('Invalid Changepoint test statistic')
-			}
-			for(i in 1:nseg(x)){
-				segments(index(data.set.ts(x))[cpts[i]+1],means[i],index(data.set.ts(x))[cpts[i+1]],means[i],col=cpt.col,lwd=cpt.width,lty=cpt.style)
-			}
+		  fitted=fitted(x)
+		  lines(index(data.set.ts(x)),fitted,type='s',col=cpt.col,lwd=cpt.width,lty=cpt.style)
 		}
 	  else if(cpttype(x)=="trend"){
 	    cpts=c(0,x@cpts)
-	    intercept=rep(param.est(x)$thetaS,x@cpts-c(0,cpts(x)))
-	    slope=rep(param.est(x)$thetaT-param.est(x)$thetaS,x@cpts-c(0,cpts(x)))/rep(x@cpts-c(0,cpts(x)),x@cpts-c(0,cpts(x)))
-	    cptn=rep(c(0,cpts(x)),x@cpts-c(0,cpts(x)))
-	    n=length(data.set(x))
-	    means=intercept+slope*((1:n)-cptn)
-	    for(i in 1:nseg(x)){
-	      segments(index(data.set.ts(x))[cpts[i]+1],means[cpts[i]+1],index(data.set.ts(x))[cpts[i+1]],means[cpts[i+1]],col=cpt.col,lwd=cpt.width,lty=cpt.style)
+	    fitted=fitted(x)
+	    for(i in 1:nseg(x)){ # still do this to not join at the changepoints
+	      segments(index(data.set.ts(x))[cpts[i]+1],fitted[cpts[i]+1],index(data.set.ts(x))[cpts[i+1]],fitted[cpts[i+1]],col=cpt.col,lwd=cpt.width,lty=cpt.style)
 	    }
 	  }
 		else{
 			stop('Invalid Changepoint Type for plotting.\n Can only plot mean, variance, mean and variance')
 		}
+		if(returnwhendone){return(x)}
 	})
 
 	setMethod("plot","cpt.range",function(x,ncpts=NA,diagnostic=FALSE,cpt.col='red',cpt.width=1,cpt.style=1,...){
@@ -683,42 +789,14 @@ setClass("cpt",slots=list(data.set="ts", cpttype="character", method="character"
 	    if(pen.type(x)=="CROPS"){
 	      stop('CROPS does not supply an optimal set of changepoints, set ncpts to the desired segmentation to plot or use diagnostic=TRUE to identify an appropriate number of changepoints')
 	    }
-	    cpts.to.plot=cpts(x)
-	    param.est=x
-	  }
-	  else{
-	    cpts.to.plot=cpts(x,ncpts=ncpts)
-	    if(test.stat(x)=="Gamma"){
-	      param.est=param(x,ncpts,shape=param.est(x)$shape)
-	    }
-	    else{
-	      param.est=param(x,ncpts)
-	    }
 	  }
 	  if(cpttype(x)=="variance"){
-	    abline(v=index(data.set.ts(x))[cpts.to.plot],col=cpt.col,lwd=cpt.width,lty=cpt.style)
+	    cpts=cpts(x,ncpts=ncpts)
+	    abline(v=index(data.set.ts(x))[cpts],col=cpt.col,lwd=cpt.width,lty=cpt.style)
 	  }
 	  else if(cpttype(x)=="mean"  ||  cpttype(x)=="mean and variance"){
-	    if((test.stat(x)=="Normal")||(test.stat(x)=="CUSUM")){
-	      means=param.est(param.est)$mean
-	    }
-	    else if(test.stat(x)=="Gamma"){
-	      means=param.est(param.est)$scale*param.est(param.est)$shape
-	    }
-	    else if(test.stat(x)=="Exponential"){
-	      means=1/param.est(param.est)$rate
-	    }
-	    else if(test.stat(x)=="Poisson"){
-	      means=param.est(param.est)$lambda
-	    }
-	    else{
-	      stop('Invalid Changepoint test statistic')
-	    }
-	    nseg=length(means)
-	    cpts.to.plot=c(0,cpts.to.plot,length(data.set(x)))
-	    for(i in 1:nseg){
-	      segments(index(data.set.ts(x))[cpts.to.plot[i]+1],means[i],index(data.set.ts(x))[cpts.to.plot[i+1]],means[i],col=cpt.col,lwd=cpt.width,lty=cpt.style)
-	    }
+	    fitted=fitted(x,ncpts=ncpts)
+	    lines(index(data.set.ts(x)),fitted,type='s',col=cpt.col,lwd=cpt.width,lty=cpt.style)
 	  }
 	  else{
 	    stop('Invalid Changepoint Type for plotting.\n Can only plot mean, variance, mean and variance')
@@ -734,9 +812,9 @@ setClass("cpt",slots=list(data.set="ts", cpttype="character", method="character"
 	  plot(data.set(x)[,1],type='l',...)
 	  if(test.stat(x)=="Normal"){
 	    cpts=c(0,x@cpts)
-	    betas=param.est(x)$beta
+	    fitted=fitted(x)
 	    for(i in 1:nseg(x)){
-	      lines((cpts[i]+1):cpts[i+1],betas[i,]%*%t(data.set(x)[(cpts[i]+1):cpts[i+1],-1]),col=cpt.col,lwd=cpt.width,lty=cpt.style)
+	      lines((cpts[i]+1):cpts[i+1],fitted[(cpts[i]+1):cpts[i+1]],col=cpt.col,lwd=cpt.width,lty=cpt.style)
 	    }
 	  }
 	  else{

diff --git a/changepoint.Rproj b/changepoint.Rproj
@@ -19,4 +19,3 @@ BuildType: Package
 PackageUseDevtools: Yes
 PackageInstallArgs: --no-multiarch --with-keep.source
 PackageCheckArgs: --as-cran --no-tests
-PackageRoxygenize: rd,collate,namespace
diff --git a/man/fitted-methods.Rd b/man/fitted-methods.Rd
@@ -0,0 +1,33 @@
+\name{fitted-methods}
+\docType{methods}
+\alias{fitted-methods}
+\alias{fitted,ANY-method}
+\alias{fitted,cpt-method}
+\alias{fitted,cpt.range-method}
+\alias{fitted,cpt.reg-method}
+\title{ ~~ Methods for Function fitted in Package `stats' ~~}
+\description{
+ ~~ Methods for function \code{fitted} in Package `stats' ~~
+}
+\section{Methods}{
+\describe{
+
+\item{\code{signature(x = "ANY")}}{
+	Generic fitted function, see stats package description using ?fitted
+}
+
+\item{\code{signature(x = "cpt")}}{
+	Returns the fitted values for the model fit to x.  Adapts to the specific model type.
+}
+\item{\code{signature(x = "cpt.range")}}{
+	As for the \code{cpt} objects except for one optional arguments, \code{ncpts}.  The \code{ncpts} option allows you to specify the fitted values for \code{ncpts} changepoints in, i.e. the optimal may be specified as 10 changes but you want to get the fitted values for the segmentation with 5 changes (provided a segmentation with 5 changes is listed in \code{cpts.full(x)}.
+}
+\item{\code{signature(x = "cpt.reg")}}{
+	Returns the fitted values for the model fit to x.  Adapts to the specific model type.
+}
+
+}}
+\keyword{methods}
+\keyword{fitted}
+\keyword{cpt}
+\keyword{internal}
diff --git a/man/plot-methods.Rd b/man/plot-methods.Rd
@@ -23,7 +23,7 @@
 	As for the \code{cpt} objects except for two optional arguments, \code{ncpts} and \code{diagnostic}.  The \code{ncpts} option allows you to specify a plot of the segmentation with \code{ncpts} changepoints in, i.e. the optimal may be specified as 10 changes but you want to plot the segmentation with 5 changes (provided a segmentation with 5 changes is listed in \code{cpts.full(x)}.  The \code{diagnostic} option when set to \code{TRUE} plots the number of changepoints in each segmentation against the penalty values that give that number of changepoints.  This can aide the decision on the number of changepoints as when a true changepoint is added the cost decreases considerably so it creates a stable region where several penalty values give the same number of changepoints, but when a changepoint due to noise is added the change in cost is small and so a small change in penalty value can vary the number of changes a lot.  This is akin to a scree plot in principal component analysis.  The idea is that someone may choose to create a plot using \code{diagnostic=TRUE}, identify the appropriate number of changes and then replot using \code{ncpts} to visualize that segmentation.
 }
 \item{\code{signature(x = "cpt.reg")}}{
-	Plotting is only valid for one regressor.  Plots the regressor against the response and identifies the changepoints using horizontal lines.  Optional arguments to control the lines: \code{cpt.col} equivilent to \code{col} to change the colour of the changepoint line; \code{cpt.width} equivilent to \code{lwd} to change the width of the changepoint line; \code{cpt.style} equivilent to \code{lty} to change the style of the line.
+	Plots the combined regressors against the response and identifies the changepoints using vertical lines.  Optional arguments to control the lines: \code{cpt.col} equivilent to \code{col} to change the colour of the changepoint line; \code{cpt.width} equivilent to \code{lwd} to change the width of the changepoint line; \code{cpt.style} equivilent to \code{lty} to change the style of the line.
 }
 
 }}

diff --git a/man/residuals-methods.Rd b/man/residuals-methods.Rd
@@ -0,0 +1,33 @@
+\name{residuals-methods}
+\docType{methods}
+\alias{residuals-methods}
+\alias{residuals,ANY-method}
+\alias{residuals,cpt-method}
+\alias{residuals,cpt.range-method}
+\alias{residuals,cpt.reg-method}
+\title{ ~~ Methods for Function residuals in Package `stats' ~~}
+\description{
+ ~~ Methods for function \code{residuals} in Package `stats' ~~
+}
+\section{Methods}{
+  \describe{
+
+    \item{\code{signature(x = "ANY")}}{
+      Generic residuals function, see stats package description using ?residuals
+    }
+
+    \item{\code{signature(x = "cpt")}}{
+      Returns the residuals values from the model fit to x.  Adapts to the specific model type.
+    }
+    \item{\code{signature(x = "cpt.range")}}{
+      As for the \code{cpt} objects except for one optional arguments, \code{ncpts}.  The \code{ncpts} option allows you to specify the residuals values for \code{ncpts} changepoints in, i.e. the optimal may be specified as 10 changes but you want to get the residuals values for the segmentation with 5 changes (provided a segmentation with 5 changes is listed in \code{cpts.full(x)}.
+    }
+    \item{\code{signature(x = "cpt.reg")}}{
+      Returns the residuals values from the model fit to x.  Adapts to the specific model type.
+    }
+
+  }}
+\keyword{methods}
+\keyword{residuals}
+\keyword{cpt}
+\keyword{internal}