R/computeOccupancy.R

Defines functions computeOccupancy

Documented in computeOccupancy

#######################################################################
# Functions
#######################################################################


computeOccupancy <- function(genomicProfiles ,
     parameterOptions=NULL,norm=TRUE,verbose=TRUE) {
    # Validity checking
    if(!.is.parameterOptions(parameterOptions) &
    !is.null(parameterOptions)){
    stop(paste0(deparse(substitute(parameterOptions)),
    "is not an occupancyProfileParamaters Object."))
    }
    if (!.is.genomicProfiles(genomicProfiles)){
    stop(paste0(deparse(substitute(genomicProfiles)),
    " is not a Genomic Profile Paramter object."))
    }

    #Generating parameterOptions if not given by user.
    #All Value will be defaut settings

    if(!is.null(parameterOptions)){
        genomicProfiles<-.updateGenomicProfiles(genomicProfiles,parameterOptions)
    }
    # GenomicProfiles parameter Extraction
  
    PWMGRList <- GRangesList(profiles(genomicProfiles))
    DNALength <- as.numeric(DNASequenceLength(genomicProfiles))
    averageExpPWMScore <- averageExpPWMScore(genomicProfiles)
    lambda <- lambdaPWM(genomicProfiles)

    ploidy <- as.numeric(ploidy(genomicProfiles))
    boundMolecules <- boundMolecules(genomicProfiles)
    backgroundSignal <- backgroundSignal(genomicProfiles)
    maxSignal <- maxSignal(genomicProfiles)



    # Computing Occupancy at sites higher than threshold
    MultiParam <- vector("list", (length(lambda)*length(boundMolecules)))
    PWMScore <- vector("list", length(PWMGRList))

    ### Essentially making sure that if regions dont have accessible DNA
    ## They will still be kept it will make things easier later down the line
    ## Also you just return a big fat falt line anyway

    dropLoci<-drop(genomicProfiles)
    if(dropLoci!="No loci dropped"){
      widthDisplay<-round(options()$width*0.5)
      cat("No Accessible DNA in: ",paste(rep(" ",
         times=(widthDisplay-nchar("StepSize: ")-nchar(dropLoci[1]))),collapse=''),
         dropLoci,"\n","\n")
      chr<-sapply(strsplit(dropLoci,":"),"[[",1)
      start<-sapply(strsplit(sapply(strsplit(dropLoci,":"),"[[",2),"\\.."),"[[",1)
      end<-sapply(strsplit(sapply(strsplit(dropLoci,":"),"[[",2),"\\.."),"[[",2)
      LocalDrop<-GRanges(seqnames=chr,ranges=IRanges(as.numeric(start), as.numeric(end)),
                          PWMScore=rep(0,length(chr)),
                          DNAaffinity=rep(0,length(chr)),
                          Occupancy=rep(0,length(chr)))
      name<-c(rep(names(PWMGRList),times=sapply(PWMGRList, length)),dropLoci)
    } else{
      name<-rep(names(PWMGRList),times=sapply(PWMGRList, length))
    }


    # chromatinState if not continuous Data

    Occupancy <- vector("list",length(PWMGRList))
    #names(Occupancy) <- names(PWMGRList)
    result <- list()
    emptyGR <- GRanges()
    # Progress message when required
    if(verbose){
    message("Computing Occupancy at sites higher than threshold. \n")
    }

    counter <- 0
    ParaVal <- c()

    #Computing Occupancy
    for(k in seq_along(lambda)){
        for(j in seq_along(boundMolecules)){

            PWMScore <- unlist(PWMGRList)$PWMScore

            Access <- unlist(PWMGRList)$DNAaffinity

            Occupancy <- rep(0,length(PWMScore))
            Occupancy <- (Access*boundMolecules[j]*exp((1/lambda[k])*PWMScore))/
                (Access*boundMolecules[j]*exp((1/lambda[k])*PWMScore) +
                DNALength*ploidy*averageExpPWMScore[k])

            Occupancy <- backgroundSignal + Occupancy*(maxSignal-backgroundSignal)
    # Normalising Ocupancy Signal
            if(norm == TRUE){
                maxOccupancy <- max(c(maxSignal,max(Occupancy)))
                Occupancy <- Occupancy/maxOccupancy
                ZeroBackground <- backgroundSignal/maxOccupancy
            } else {
                ZeroBackground <- backgroundSignal
            }


            buffer <- unlist(PWMGRList)

            buffer$Occupancy <- Occupancy
            if(dropLoci!="No loci dropped"){
               buffer<-c(buffer,LocalDrop)
            }
    # Extracting and pasting names of Parameters
            names(buffer) <- name
            if(length(name > 1)){
                level <- factor(names(buffer),levels=unique(name))
                result <- split(buffer,level)

            } else {
                result <-  buffer
            }

            counter <- counter+1
            MultiParam[[counter]] <- result
            ParaVal <- c(ParaVal,paste0("lambda = ",lambda[k]," & ",
            "boundMolecules = ",boundMolecules[j]))
        }
    }

    # ReBuilding GenomicProfileParameters
    names(MultiParam) <- ParaVal

    .ZeroBackground(genomicProfiles)<- ZeroBackground
    .profiles(genomicProfiles)<-MultiParam
    .tags(genomicProfiles)<-"Occupancy"
    .paramTag(genomicProfiles)<-"Occupancy"
    return(genomicProfiles)
}

Try the ChIPanalyser package in your browser

Any scripts or data that you put into this service are public.

ChIPanalyser documentation built on Nov. 8, 2020, 8:23 p.m.