R/InternalFrequency_SVMerge.r

Defines functions internalFrequencyTrio_Duo

Documented in internalFrequencyTrio_Duo

#' Calculates the internal frequencies of SV in internal cohorts,
#' for SVMerge
#'
#' @param mergedFiles  character. Path to the merged SV files.
#' @param smappath  character. path to the query smap file.
#' @param smap  character. File name for the smap
#' @param smapdata  character. Dataframe if input type chosen as dataframe.
#' @param buildSVInternalDB  boolean. Checking whether the merged solo 
#' file database exist.
#' @param input_fmt_SV Format in which data 
#' is provided as an input to thefunction.
#' @param path  character. Path to the solo file database.
#' @param pattern  character. pattern of the file names to merge.
#' @param outpath  character. Path to merged SV solo datasets.
#' @param dbOutput  character. Output of merged bionano data.
#' @param fname  character. Filename in case dbOutput = Text.
#' @param win_indel  N umeric. Insertion and deletion error window.
#' Default 10000.
#' @param win_inv_trans  Numeric. Inversion and translocation error window.
#' Default 50000.
#' @param perc_similarity  Numeric . ThresholdPercentage similarity 
#' of the query SV and reference SV. Default 0.5.
#' @param perc_similarity_parents  Numeric . ThresholdPercentage similarity 
#' for zygosity determination. Default 0.9.
#' @param EnzymeType Character. Type of enzyme. Options Dual and DLE.
#' @param indelconf  Numeric. Threshold for insertion and deletion confidence.
#' Default 0.5
#' @param invconf  Numeric. Threshold for inversion confidence.Default 0.01.
#' @param transconf  Numeric. Threshold for translocation confidence. 
#' Default 0.1.
#' @param limsize Numeric. Minimum size of SV that can be determined 
#' acurately by the Bionano SV caller. Default 1000.
#' @param win_indel_parents  Numeric. Insertion and deletion error window to 
#' determine zygosity in case of parents. Default 5000.
#' @param win_inv_trans_parents  Numeric. Inversion and translocation error 
#' window to determine zygosity in case of parents. Default 40000.
#' @param indexfile File containing connection between sample and nanoIDs
#' @param labelType character. Type of labels used for mapping. 
#'        Choices are Dual, DLE and Both.
#' @param SVMerge_path    character. Path for the Dual labelled cmap
#' @param SVMerge_pattern    character. pattern of the dual files.
#' @param SE_path    character. Path for the Dual labelled cmap
#' @param SE_pattern    character. pattern of the dual files.
#' @param Samplecodes character. File containing relations and IDs 
#' associated to them.
#' @param mergeKey character. File containing sample ID and relation.
#' @param outpath character. Path where the merged samples are kept.
#' @param mergedKeyoutpath character. File path storing sample name and nanoID
#'        key information.
#' @param mergedKeyFname character. File name storing sample name and nanoID
#'        key information.
#' @param returnMethod character. Choice between Text and DataFrame.
#' @param returnMethod character. Choice between Text and DataFrame.
#' Required if you want to calculate internal frequency.
#' @return Calculated internal frequency in dataframe or text.
#' @examples
#' smapName="GM24385_Ason_DLE1_VAP_trio5.smap"
#' smap = system.file("extdata", smapName, package="nanotatoR")
#' indelconf = 0.5; invconf = 0.01;transconf = 0.1;input_fmt_SV="Text";
#' datInf <- internalFrequency_solo( smap = smap, 
#' buildSVInternalDB = FALSE, win_indel=10000, 
#' win_inv_trans=50000, EnzymeType = "SE",
#' mergedFiles = system.file("extdata", "nanotatoRControl.txt", package="nanotatoR"), 
#' perc_similarity_parents =0.9,
#' indexfile = system.file("extdata", "Sample_index.csv", package="nanotatoR"),
#' perc_similarity=0.5, indelconf=0.5, invconf=0.01, 
#' transconf=0.1, limsize=1000, win_indel_parents=5000,input_fmt="Text",
#' win_inv_trans_parents=40000,
#' returnMethod="dataFrame", input_fmt_SV = "Text")
#' @importFrom stats na.omit 
#' @import tidyverse
#' @import hash
#' @importFrom rlang .data
#' @importFrom dplyr mutate group_by summarise
#' @export
internalFrequencyTrio_Duo <- function(mergedFiles, smappath , smap , 
    buildSVInternalDB=FALSE, smapdata, 
    path, pattern, outpath, win_indel=10000, win_inv_trans=50000, 
    perc_similarity=0.5, indelconf=0.5, invconf=0.01, fname, 
    limsize=1000, win_indel_parents=5000,win_inv_trans_parents=40000, 
    transconf=0.1, dbOutput =c("dataframe","text"),
    perc_similarity_parents=0.9,
    returnMethod=c("Text","dataFrame"),
    input_fmt_SV=c("Text","dataFrame"),
    indexfile,
    EnzymeType = c("SVmerge", "SE"),
    labelType = c("SVMerge", "SE", "Both"),
    SVMerge_path ,SVMerge_pattern , 
    SE_path , SE_pattern,
    Samplecodes ,mergeKey,
    mergedKeyoutpath, mergedKeyFname){
    #library(hash)

    print("###Calculating the Internal Frequency###")
    if(buildSVInternalDB == TRUE){
        r <- merging_SE_SVMerge(
            labelType = labelType, 
            SVMerge_path = SVMerge_path, 
            SVMerge_pattern = SVMerge_pattern, 
            SE_path = SE_path, 
            SE_pattern = SE_pattern, 
            Samplecodes = Samplecodes, 
            mergeKey = mergeKey, 
            mergedKeyoutpath = mergedKeyoutpath,
            mergedKeyFname = mergedKeyFname,
            outputMode = "dataframe")
    }
    else{
        r <- read.table(mergedFiles, sep = "\t", header = TRUE)
    }
    usamp <- length(unique(r$nanoID))
    if(input_fmt_SV=="dataFrame"){
        smapdata = smapdata
        if(EnzymeType == "SVMerge"){
            #smapdata <- readSMap(smap, input_fmt_smap = "Text")
            SVID <- smapdata$SVIndex
        }
        else{
            #smapdata <- readSMap_DLE(smap, input_fmt_smap)
            SVID <- smapdata$SmapEntryID
        }
    }
    else if(input_fmt_SV=="Text"){
        if(EnzymeType == "SVMerge"){
            smapdata <- readSMap(smap, input_fmt_smap = "Text")
            SVID<-smapdata$SVIndex
        }
        else{
            smapdata <- readSMap_DLE(smap, input_fmt_smap = "Text")
            SVID<-smapdata$SmapEntryID
        }
    }
    else{
        stop("Input format for SMAP Incorrect")
    }
    r1 <- smapdata
    sampID <- str_squish(as.character(unique(r1$SampleID)))
    
    ufam <- as.character(unique(r$nanoID))
    famid <- c()
    for (qp in seq_len(length(ufam)))
    {
        stt <- strsplit(ufam[[qp]][1], split = "[.]")
        famid <- c(famid, as.character(stt[[1]][1]))
    }
    datf1 <- data.frame(table(famid))
    ha <- hash()
    .set(ha, keys = as.character(datf1$famid), 
        values = as.character(datf1$Freq))
    ## Checking Sex male/female and assigning chromosome number accordingly
    chro1 <- sort(unique(r1$RefcontigID1))
    #chro1 <- c(1:chro)
    dataFinal <- c()
    for (ii in seq_along(chro1))
    {
       
        dat <- r[which(r$RefcontigID1 == chro1[ii]), ]
        
        # variantType1<-dat$variantsubtype Changing the variant terms in DGV to
        # match svmap
        variantType1 <- dat$Type
        BSPQI_status_DB <- as.character(dat$Found_in_self_BSPQI_molecules)
        BSSSI_status_DB <- as.character(dat$Found_in_self_BSSSI_molecules)
        ## Extracting data from SVmap
        dat1 <- r1[which(r1$RefcontigID1 == chro1[ii]), ]
        chromo2<-dat1$RefcontigID2
        ## Adding the windows to the breakpoints
        rf <- dat1$RefStartPos
        rf_wb_ind <- rf - win_indel
        rf_fb_ind <- rf + win_indel
        rf_wb_int <- rf - win_inv_trans
        rf_fb_int <- rf + win_inv_trans
        re <- dat1$RefEndPos
        re_wf_ind <- re + win_indel
        re_wb_ind <- re - win_indel
        re_wb_int <- re - win_inv_trans
        re_fb_int <- re + win_inv_trans
        ## Calculating size
        size_bn <- dat1$Size
        conf1 <- dat1$Confidence
        variantType2 <- as.character(dat1$Type)
        ###Parents Zygosity check
        'win_indel_parents<-as.numeric(win_indel_parents[oo])
        win_inv_trans_parents<- as.numeric(win_inv_trans_parents[oo])
        perc_similarity_parents<-as.numeric(perc_similarity_parents[oo])'
        #win_indel_parents<-as.numeric(win_indel_parents)
        #win_inv_trans_parents<- as.numeric(win_inv_trans_parents)
        'win_inv_trans_parents<- as.numeric(win_inv_trans_parents[oo])'
        #perc_similarity_parents<-as.numeric(perc_similarity_parents)
        rf_wb_ind_parents <- rf - win_indel_parents
        rf_fb_ind_parents <- rf + win_indel_parents
        rf_wb_int_parents <- rf - win_inv_trans_parents
        rf_fb_int_parents <- rf + win_inv_trans_parents
        #re <- dat1$RefEndPos
        re_wf_ind_parents <- re + win_indel_parents
        re_wb_ind_parents <- re - win_indel_parents
        re_wb_int_parents <- re - win_inv_trans_parents
        re_fb_int_parents <- re + win_inv_trans_parents
        # svfam<-as.character(dat1$SVIdentifier)
        #print(indexfile)
        if(buildSVInternalDB == FALSE){
            famindexfile <-read.csv(indexfile)
        }        else{
            famindexfile <- read.csv(file.path(
                mergedKeyoutpath = mergedKeyoutpath, 
                mergedKeyFname = mergedKeyFname))
            }
        ha1 <- hash()
        .set(ha1, keys = famindexfile$SampleID, values =  famindexfile$NID)
        val1 <-as.character(hash::values(ha1, keys = sampID))
        stt1 <- strsplit(val1, split = "\\.")
        patID <- stt1[[1]][2]
        svfamid <- stt1[[1]][1]
        ha2 <- hash()
        .set(ha2, keys = famindexfile$SampleID, values = famindexfile$Tag)
        'if((length(grep("\\\\",smap))>=1)){
            spl<-strsplit(as.character(smap), split = "\\\\")
            lenspll1<-length(spl[[1]])
            spl1 <- strsplit(as.character(spl[[1]][lenspll1]), split = "_")
            # svfamid<-as.character(spl1[[1]][2])
            spl2 <- strsplit(as.character(spl1[[1]][1]), split = "[.]")
            patID <- spl2[[1]][2]
            svfamid <- spl2[[1]][1]
        }
        else if((length(grep("/",smap))>=1)){
            spl<-strsplit(as.character(smap), split = "/")
            lenspll1<-length(spl[[1]])
            spl1 <- strsplit(as.character(spl[[1]][lenspll1]), split = "_")
            # svfamid<-as.character(spl1[[1]][2])
            spl2 <- strsplit(as.character(spl1[[1]][1]), split = "[.]")
            patID <- spl2[[1]][2]
            svfamid <- spl2[[1]][1]
        }
        else{
            spl1 <- strsplit(as.character(smap), split = "_")
            # svfamid<-as.character(spl1[[1]][2])
            spl2 <- strsplit(as.character(spl1[[1]][1]), split = "[.]")
            patID <- spl2[[1]][2]
            svfamid <- spl2[[1]][1]
        }'
        # svind<-dat1$SVIndex
        bsssi<-c()
        bspqi<-c()
        rest<-c()
        # conf<-dat$Confidence countfre<-0 percn<-c()
        datf <- c()
        print(paste('Chrom:',ii,sep=''))
        #for (nn in 1:20)
        for (nn in seq_along(rf))
        {
            
            #print(paste("nn:",nn)) 
           
            if ((variantType2[nn] == "deletion" | 
                variantType2[nn] == "insertion")){ 
                        
                dat2 <-dat[which((dat$RefStartPos >= rf_wb_ind[nn] 
                            & dat$RefEndPos <= re_wf_ind[nn])),]
                    
                size1 <- size_bn[nn]
                ## Calculating Internal Frequency
                if (nrow(dat2) > 1)
                {
                    dat2$perc_ref_query <- as.numeric(dat2$Size)/size1
                    dat2$perc_query_ref <- size1/as.numeric(dat2$Size)
                    stt12 <- str_split(as.character(dat2$nanoID), 
                        pattern = "\\.")
                    famid <- c(); relnid <- c()
                    
                    'for(ee in seq_along(stt12)){
                        famid <- c(famid, as.character(stt12[[ee]][1]))
                        relnid <- c(relnid, as.character(stt12[[ee]][2]))
                    }
                    '
                    dat2$FamilyID <- sapply(stt12, function(x) x[1])
                    dat2$RelationID <- sapply(stt12, function(x) x[2])
                    dat2MomEqual <- dat2[which(((dat2$RefStartPos == rf[nn]) 
                        & (dat2$RefEndPos==re[nn])) 
                        & (dat2$perc_ref_query >= perc_similarity_parents 
                        & dat2$perc_query_ref >= perc_similarity_parents) 
                        & (as.character(dat2$Type) == variantType2[nn])
                        & (as.character(dat2$FamilyID) == svfamid)
                        & (patID == 1 & 
                        dat2$RelationID == 2)),]
                    dat2DadEqual <- dat2[which(((dat2$RefStartPos ==rf[nn]) & 
                        (dat2$RefEndPos==re[nn])) & 
                        (dat2$perc_ref_query >= perc_similarity_parents 
                        & dat2$perc_query_ref >= perc_similarity_parents) 
                        & (as.character(dat2$Type) == variantType2[nn]) 
                        & (as.character(dat2$FamilyID) == svfamid)
                        & (patID == 1 
                        & dat2$RelationID == 3)),]
                    dat2MomRange <- dat2[which(((
                        dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                        & (dat2$RefEndPos <= re_fb_int_parents[nn]))
                        & (dat2$perc_ref_query >= perc_similarity_parents 
                        & dat2$perc_query_ref >= perc_similarity_parents) 
                        & (as.character(dat2$Type) == variantType2[nn])
                        & (as.character(dat2$FamilyID) == svfamid)
                        & (patID == 1
                        & dat2$RelationID == 2)),]
                    'dat2MomRange <- subset(dat2,((((RefStartPos <= rf[nn] & 
                        RefStartPos >= rf_wb_ind_parents[nn]) | 
                        (RefStartPos >= rf[nn] & RefStartPos <= rf_wb_ind_parents[nn])) 
                        & ((RefEndPos >= re[nn] & RefStartPos <= re_wf_ind_parents[nn]) 
                        | (RefEndPos <= re[nn] & dat2$RefEndPos >= re_wf_ind_parents[nn]))) 
                        & (dat2$perc >= perc_similarity) 
                        & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 2)))'
                    dat2DadRange <- dat2[which(((
                        dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                        & (dat2$RefEndPos <= re_fb_int_parents[nn]))
                        & (dat2$perc_ref_query >= perc_similarity_parents 
                        & dat2$perc_query_ref >= perc_similarity_parents) 
                        & (as.character(dat2$Type) == variantType2[nn])
                        & (as.character(dat2$FamilyID) == svfamid)
                        & (patID == 1 
                        & dat2$RelationID == 3)),]
                    dat2Frequency <- dat2[which((
                        dat2$perc_ref_query >= perc_similarity 
                        & dat2$perc_query_ref >= perc_similarity) 
                        & (dat2$Size >= limsize)
                        & (as.character(dat2$Type) == variantType2[nn])
                        & (as.character(dat2$FamilyID) != svfamid)
                        & (dat2$Confidence >= indelconf)
                        & ((dat2$Found_in_self_BSPQI_molecules == "yes" 
                        & dat2$Found_in_self_BSSSI_molecules == "yes") 
                        | (dat2$Found_in_self_BSPQI_molecules == "no" 
                        & dat2$Found_in_self_BSSSI_molecules == "yes") 
                        | (dat2$Found_in_self_BSPQI_molecules == "yes" 
                        & dat2$Found_in_self_BSSSI_molecules == "no") 
                        | (dat2$Found_in_self_BSPQI_molecules == "yes" 
                        & dat2$Found_in_self_BSSSI_molecules == "-") 
                        | (dat2$Found_in_self_BSPQI_molecules == "-" 
                        & dat2$Found_in_self_BSSSI_molecules == "yes")
                        | (dat2$Found_in_SE_self_molecules == "yes"))
                        & ((dat2$Type1 =="insertion" & dat2$Type2 =="insertion") 
                        | (dat2$Type1 =="insertion" & is.na(dat2$Type2)) 
                        | (is.na(dat2$Type1) & dat2$Type2 =="insertion") 
                        | (dat2$Type1 == "deletion" & dat2$Type2 == "deletion") 
                        | (dat2$Type1 == "deletion" & is.na(dat2$Type2)) 
                        | (is.na(dat2$Type1) & dat2$Type2 =="deletion")
                        | (dat2$Type1 == "-" 
                        & dat2$Type2 == "-" & dat2$Type == "deletion")
                        | (dat2$Type1 == "-" 
                        & dat2$Type2 == "-" & dat2$Type == "insertion"))),]
                    dat2UnfilteredFrequency <- dat2[which((
                        dat2$perc_ref_query >= perc_similarity & 
                        dat2$perc_query_ref >= perc_similarity)
                        & (as.character(dat2$FamilyID) != svfamid)
                        & (as.character(dat2$Type) == variantType2[nn])),]
                         
                    
                    
                    'countfre <- c();countfreunfilt<-c()
                    sv1 <- dat2$nanoID
                    
                    # svind1<-dat2$SVIndex
                    #sv1 <- strsplit(as.character(svfam1), split = "_")
                    size_internal <- dat2$Size
                    zygo <- as.character(dat2$Zygosity)
                    type <- as.character(dat2$Type)
                    typ1 <- as.character(dat2$Type1)
                    typ2 <- as.character(dat2$Type2)
                    #svid <- as.numeric(dat2$SVIndex)
                    \'if (length(grep("SVIndex",names(smap)))>0){
                        svid <- dat2$SVIndex
                    }
                    else{
                        svid <- dat2$SmapEntryID
                    }\'
                    BSPQI_status_DB <- 
                        as.character(dat2$Found_in_self_BSPQI_molecules)
                    BSSSI_status_DB <- 
                        as.character(dat2$Found_in_self_BSSSI_molecules)
                    svStrt<-as.numeric(dat2$RefStartPos)
                    svEnd<-as.numeric(dat2$RefEndPos)
                    type1<-as.character(dat2$Type1)
                    type2<-as.character(dat2$Type2)
                    conf <- dat2$Confidence
                    motherZygosity <- c()
                    fatherZygosity <- c()
                    motherZygosity_exact <- c()
                    fatherZygosity_exact <- c()
                    svfamid3 <- c()
                    svfamid3_unfilt <- c()
                    bsssi<-c()
                    bs_bq<-c()
                    bspqi<-c()
                    svSAMP<-c()
                    svSAMP_unfiltered<-c()
                    homozygo<-c()
                    for (ll in seq_len(nrow(dat2))){
                        perc <- (size1/size_internal[ll])
                        print(perc)
                        print (sv1[ll])
                        #### print(perc) print(type[ll])
                        stt <- strsplit(as.character(sv1[ll]), split = "[.]")
                        patID1 <- stt[[1]][2]
                        svfamid1 <- stt[[1]][1]
                        #### print(svfamid1)
                        ###Filtered INDEL
                        ##Check whether the parents have same breakpoints 
                        ##as the proband
                    
                        
                        if (((svStrt[ll]==rf[nn]) & (svEnd[ll]==re[nn])) & 
                            (perc_ref_query >= perc_similarity & perc_query_ref >= perc_similarity) & 
                            identical(type[ll], variantType2[nn]) & 
                            (identical(svfamid1, svfamid))){
                            # Family Extra column zygosity
                            if (patID == 1 & patID1 == 2){
                          
                                # svfamid3<-c(svfamid3,svfamid1)
                                motherZygosity_exact <- c(motherZygosity_exact,
                                    as.character(zygo[ll]))
                                fatherZygosity_exact <- c(fatherZygosity_exact, 
                                    NULL)
                            } 
                            else if (patID == 1 & patID1 == 3){
                                
                                motherZygosity_exact <- c(motherZygosity_exact,
                                    NULL)
                                fatherZygosity_exact <- c(fatherZygosity_exact,
                                    as.character(zygo[ll]))
                            }   
                            else if (patID == patID1){
                                motherZygosity_exact <- c(motherZygosity_exact,
                                    NULL)
                                fatherZygosity_exact <- c(fatherZygosity_exact,
                                    NULL)
                            } 
                            else{
                                # svfamid3<-c(svfamid3,svfamid1)
                          
                                motherZygosity_exact <- c(motherZygosity_exact,
                                    NULL)
                                fatherZygosity_exact <- c(fatherZygosity_exact,
                                    NULL)
                            }
                        } 
                        else if ((perc_ref_query >= perc_similarity & perc_query_ref >= perc_similarity) & 
                            identical(type[ll], variantType2[nn]) & 
                            (identical(svfamid1, svfamid)) & 
                            ((( svStrt[ll] <= rf[nn] & 
                            svStrt[ll] >= rf_wb_ind_parents[nn]) | 
                            (svStrt[ll] >= rf[nn] & 
                            svStrt[ll] <= rf_fb_ind_parents[nn])) & 
                            ((svEnd[ll] >= re[nn] & 
                            svEnd[ll] <= re_wf_ind_parents[nn]) |
                            (svEnd[ll] <= re[nn] & 
                            svEnd[ll] >= re_wb_ind_parents[nn])))
                            ){
                            #Family Extra column zygosity
                                if (patID == 1 & patID1 == 2){
                        
                                    # svfamid3<-c(svfamid3,svfamid1)
                                    motherZygosity <- c(motherZygosity, 
                                        as.character(zygo[ll]))
                                    fatherZygosity <- c(fatherZygosity, NULL)
                                } 
                                else if (patID == 1 & patID1 == 3){
                                    
                                    motherZygosity <- c(motherZygosity, NULL)
                                    fatherZygosity <- c(fatherZygosity, 
                                        as.character(zygo[ll]))
                                } 
                                else if (patID == patID1){
                         
                                    motherZygosity <- c(motherZygosity, NULL)
                                    fatherZygosity <- c(fatherZygosity, NULL)
                                } 
                                else {
                                    # svfamid3<-c(svfamid3,svfamid1)
                        
                                    motherZygosity <- c(motherZygosity, NULL)
                                    fatherZygosity <- c(fatherZygosity, NULL)
                                }
                            }
                            else if ((perc_ref_query >= perc_similarity & perc_query_ref >= perc_similarity) & 
                                (identical(type[ll], variantType2[nn])) &
                                ((size_internal[ll]>=limsize)) & 
                                !(identical(svfamid1, svfamid)) & 
                                (conf[ll] >= indelconf) & 
                                ((BSPQI_status_DB[ll] == "yes" & 
                                BSSSI_status_DB[ll] == "yes") 
                                | (BSPQI_status_DB[ll] == "no" & 
                                BSSSI_status_DB[ll] == "yes") | 
                                (BSPQI_status_DB[ll] == "yes" & 
                                BSSSI_status_DB[ll] == "no") | 
                                (BSPQI_status_DB[ll] == "yes" & 
                                BSSSI_status_DB[ll] == "-") | 
                                (BSPQI_status_DB[ll] == "-" & 
                                BSSSI_status_DB[ll] == "yes")) & 
                                ((typ1[ll]=="insertion" & 
                                typ2[ll]=="insertion") | 
                                (typ1[ll]=="insertion" & is.na(typ2[ll])) |
                                (is.na(typ1[ll]) & typ2[ll]=="insertion") | 
                                (typ1[ll]=="deletion" & typ2[ll]=="deletion") |
                                (typ1[ll]=="deletion" & is.na(typ2[ll])) | 
                                (is.na(typ1[ll]) & typ2[ll]=="deletion"))
                                ) {
                                #print ("Not in the same family")
                                countfre <- c(countfre,1)
                                print(countfre)
                                svfamid3 <- c(svfamid3, as.character(sv1[ll]))
                                motherZygosity <- c(motherZygosity, "-")
                                fatherZygosity <- c(fatherZygosity, "-")
                                svSAMP<-c(svSAMP,ll)
                                if(as.character(zygo[ll])=="homozygous"){
                                    homozygo<-c(homozygo, 
                                    as.character((sv1[ll])))
                                }
                                else{
                                    homozygo<-c(homozygo, NULL)
                                }
                            }
                            else{
                                
                                motherZygosity <- c(motherZygosity, "-")
                                fatherZygosity <- c(fatherZygosity, "-")     
                            }
                            ###Unfiltered INDEL
                           if (perc >= perc_similarity & 
                                identical(type[ll], variantType2[nn]) &
                                !(identical(svfamid1, svfamid))){
                                countfreunfilt <- c(countfreunfilt,1)
                                svfamid3_unfilt <- c(svfamid3_unfilt, 
                                    as.character(sv1[ll]))
                                svSAMP_unfiltered<-c(svSAMP_unfiltered,ll)
                            }
                            else{
                               \'print ("SVs does not meet the unfiltered 
                                    criteria!!!")\'
                            }
                      
                     
                    
                        }'
                    ##Filtered
                    if (is.null(dat2Frequency)){
                            filtFreq  = 0
                            cntHomozygotes = 0
                    }else if (nrow(dat2Frequency) > 0){
                        dat2Homozygotes <- data.frame(dat2Frequency %>% 
                            mutate(Homozygo = .data$Zygosity=="homozygous") 
                        %>%     group_by(.data$nanoID) 
                        %>%     summarise (Homozygotes = sum(.data$Homozygo)))
                        cntHomozygotes <- sum(dat2Homozygotes$Homozygo)
                        dat2Homozygotes [,2] <- ifelse(
                                dat2Homozygotes[,2] > 0, 2, 0
                                )
                        dat2Heterozygotes <- data.frame(
                                dat2Frequency 
                                %>%     mutate(
                                Heterozygo = .data$Zygosity == "heterozygous"
                                ) 
                        %>%     group_by(.data$nanoID) 
                        %>%     summarise (Heterozygotes = sum(.data$Heterozygo
                        )))
                        dat2Heterozygotes [,2] <- ifelse(
                                    dat2Heterozygotes[,2] > 0, 1, 0
                                    )
                        dat2Unknown <- data.frame(dat2Frequency 
                        %>%     mutate(Unknown = .data$Zygosity == "unknown") 
                        %>%     group_by(.data$nanoID) 
                        %>%     summarise (Unknown = sum(.data$Unknown)))
                        dat2Unknown [,2] <- ifelse(
                                dat2Unknown[,2] > 0, 2, 0
                                )
                        dat2filtFreq <- data.frame(
                                NR = dat2Homozygotes[,1], 
                                Homozygote = dat2Homozygotes[,2],
                                Heterozygotes = dat2Heterozygotes[,2], 
                                Unknown = dat2Unknown[,2])
                        row.names(dat2filtFreq) <- as.character(
                                dat2Homozygotes[,1])
                        dat2filtFreq$RowSum <- ifelse(
                                (dat2filtFreq$Heterozygotes ==1 
                                & (dat2filtFreq$Homozygote == 0 
                                & dat2filtFreq$Unknown == 0)), 1, 2)
                        filtFreq <- sum(dat2filtFreq$RowSum)
                    }else{
                            filtFreq  = 0
                            cntHomozygotes = 0
                        }
                        
                    
                    ###Unfiltered
                    if (is.null(dat2UnfilteredFrequency)){
                            filtFreq  = 0
                            cntHomozygotes = 0
                    }else if (nrow(dat2UnfilteredFrequency) > 0){
                        dat2Homozygotes <- data.frame(
                            dat2UnfilteredFrequency 
                            %>%     mutate(Homozygo=.data$Zygosity=="homozygous") 
                            %>%     group_by(.data$nanoID) 
                            %>%     summarise (Homozygotes = sum(.data$Homozygo)))
                        #cntHomozygotes <- sum(dat2Homozygotes$Homozygotes)
                        dat2Homozygotes [,2] <- ifelse(
                                dat2Homozygotes[,2] > 0, 2, 0
                                )
                        dat2Heterozygotes <- data.frame(
                                    dat2UnfilteredFrequency 
                                    %>%     mutate(
                                    Heterozygo = .data$Zygosity == "heterozygous") 
                                    %>%     group_by(.data$nanoID) 
                                    %>%     summarise (Heterozygotes = sum(.data$Heterozygo)))
                        dat2Heterozygotes [,2] <- ifelse(
                                        dat2Heterozygotes[,2] > 0, 1, 0
                                        )
                        dat2Unknown <- data.frame(dat2UnfilteredFrequency 
                        %>%     mutate(Unknown = .data$Zygosity == "unknown") 
                        %>%     group_by(.data$nanoID) 
                        %>%     summarise (Unknown = sum(.data$Unknown)))
                        dat2Unknown [,2] <- ifelse(
                                dat2Unknown[, 2] > 0, 2, 0
                                )
                        dat2unfiltFreq <- data.frame(
                                    Homozygote = dat2Homozygotes[,2],
                                    Heterozygotes = dat2Heterozygotes[,2], 
                                    Unknown = dat2Unknown[,2])
                        row.names(dat2unfiltFreq) <- as.character(
                                        dat2Homozygotes[,1]
                                        )
                        dat2unfiltFreq$RowSum <- ifelse((
                                    dat2unfiltFreq$Heterozygotes ==1 
                                    & (dat2unfiltFreq$Homozygote == 0 
                                    & dat2unfiltFreq$Unknown == 0)), 1, 2)
                        UnfilteredFrequency  = sum(dat2unfiltFreq$RowSum)
                        } else{
                            UnfilteredFrequency = 0
                        }
                        
                  
                    ##Calculating filtered Frequency INDEL
                    ##Zygosity Parent
                        if(length(dat2DadEqual$Zygosity) > 0){
                            if(length(as.character(unique
                            (dat2DadEqual$Zygosity))) == 1){
                                fatherZygosity<-as.character(
                                unique(dat2DadEqual$Zygosity)
                                )
                            }else {
                                fatherZygosity <- paste(
                                as.character(dat2DadEqual$Zygosity), 
                                collapse = ","
                                )
                            }
                        } else if (length(dat2DadRange$Zygosity) > 0){
                        fatherzygosity <- as.character(dat2DadRange$Zygosity)
                        fatherZygosity1 <- gsub("-", NA, fatherzygosity)
                        fatherZygosity1 <- as.character(
                                na.omit(fatherZygosity1)
                                )
                        if(length(fatherZygosity1) == 1){
                            fatherZygosity<-as.character(
                            unique(fatherZygosity1)
                            )
                        }else {
                            fatherZygosity <- paste(
                                as.character(fatherZygosity1), 
                                collapse = ","
                                )
                        }
                        }else {
                            fatherZygosity <- "-"
                            }
                       
                        ###Mother Zygosity
                        if(length(dat2MomEqual$Zygosity) > 0){
                            if(length(as.character(unique
                            (dat2MomEqual$Zygosity))) == 1){
                                motherZygosity<-as.character(
                                unique(dat2MomEqual$Zygosity)
                                    )
                            }else {
                                motherZygosity <- paste(
                                as.character(dat2MomEqual$Zygosity), 
                                collapse = ","
                                )
                            }
                        }else if (length(dat2MomRange$Zygosity) > 0){
                        motherZygosity <- as.character(dat2MomRange$Zygosity)
                        motherZygosity1 <- gsub("-", NA, motherZygosity)
                        motherZygosity1 <- as.character(
                                na.omit(motherZygosity1)
                                )
                        if(length(motherZygosity1) == 1){
                            motherZygosity<-as.character(
                            unique(motherZygosity1)
                            )
                        }else {
                            motherZygosity <- paste(
                                as.character(motherZygosity1), 
                                collapse = ","
                                )
                        }
                        } else {
                            motherZygosity <- "-"
                            }
                       
                  
                        'if(length(homozygo)>=1){
                            homozygo <- length(unique(homozygo))
                        }
                        else if(length(homozygo)==1){
                            homozygo <- length(homozygo)
                        }
                        else{
                            homozygo <- 0
                        }'
                                        
                  
                        famno <- unname(hash::values(ha2, keys = sampID))
                        fampas <- paste(
                                "^",as.character(famindexfile$Tag),"$", sep=""
                                )
                        famnopas <- paste("^",as.character(famno),"$",sep="")
                        famnumb <- length(grep(famnopas, fampas, fixed=TRUE))
                        data1 <- data.frame(dat1[nn, ], 
                            Internal_Freq_Perc_Filtered = 
                            as.numeric(format(round(
                            (filtFreq/(2*(usamp - famnumb))) * 100,digits=3)
                            , scientific = FALSE)),
                            Internal_Freq_Perc_Unfiltered = 
                            as.numeric
                            (format(round((UnfilteredFrequency/
                            (2*(usamp - famnumb))) * 100,digits=3), 
                            scientific = FALSE)),
                            Internal_Homozygotes=as.numeric(cntHomozygotes), 
                            MotherZygosity = as.character(motherZygosity), 
                            FatherZygosity = as.character(fatherZygosity),  
                            stringsAsFactors = FALSE)
                        
                        datf <- rbind(datf, data1)
                }  
                else if (nrow(dat2) == 1){
                    # dgv_match=TRUE Calculating percentage similarity
                    countfre <- 0;countfreunfilt<-0
                    conf <- dat2$Confidence
                    size_internal <- dat2$Size
                    BSPQI_status_DB <- as.character(
                        dat2$Found_in_self_BSPQI_molecules)
                    BSSSI_status_DB <- as.character(
                        dat2$Found_in_self_BSSSI_molecules)
                    perc_query_ref <- (size1/size_internal)
                    perc_ref_query <- (size_internal/size1)
                    sv1 <- dat2$nanoID
                    #Found_in_SE_self_molecules <- dat2$Found_in_SE_self_molecules
                    Found_in_SE_self_molecules <- dat2$Found_in_SE_self_molecules 
                    zygo <- as.character(dat2$Zygosity)
                    stt <- strsplit(as.character(sv1), split = "[.]")
                    patID1 <- stt[[1]][2]
                    svfamid1 <- stt[[1]][1]
                    motherZygosity <- ""
                    fatherZygosity <- ""
                    type <- as.character(dat2$Type)
                    typ1 <- as.character(dat2$Type1)
                    typ2 <- as.character(dat2$Type2)
                    homozygo<-c()
                    ##Check for parents
                    if ((perc_ref_query >= perc_similarity_parents 
                        & perc_query_ref >= perc_similarity_parents) 
                        & identical(type, variantType2[nn]) 
                        & (identical(svfamid1, svfamid)) 
                        & ((dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                        & (dat2$RefEndPos <= re_fb_int_parents[nn]))){
                        # Family Extra column zygosity
                        if (patID == 1 & patID1 == 2){
                            motherZygosity <- as.character(zygo)
                            fatherZygosity <- "-"
                        } 
                        else if (patID == 1 & patID1 == 3){
                            motherZygosity <- "-"
                            fatherZygosity <- as.character(zygo)
                        } 
                        else if (patID == patID1){
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                        } 
                        else{
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                        }
                    }
                    else if ((perc_ref_query >= perc_similarity 
                        & perc_query_ref >= perc_similarity) 
                        & type == variantType2[nn]
                        & !(identical(svfamid1, svfamid)) 
                        & ((size_internal>=limsize)) 
                        & ((BSPQI_status_DB == "yes" 
                        & BSSSI_status_DB == "yes") 
                        | (BSPQI_status_DB == "no" 
                        & BSSSI_status_DB == "yes") 
                        | (BSPQI_status_DB == "yes" 
                        & BSSSI_status_DB == "no")
                        | (BSPQI_status_DB == "yes" 
                        & BSSSI_status_DB == "-") 
                        | (BSPQI_status_DB == "-" 
                        & BSSSI_status_DB == "yes") 
                        | (Found_in_SE_self_molecules == "yes")) 
                        & (conf > indelconf) 
                        & ((typ1=="insertion" & typ2=="insertion") 
                        | (typ1=="insertion" & is.na(typ2)) 
                        | (is.na(typ1) & typ2=="insertion") 
                        | (typ1=="deletion" & typ2=="deletion") 
                        | (typ1=="deletion" & is.na(typ2)) 
                        | (is.na(typ1) & typ2=="deletion")
                        | (typ1 == "-" & typ2 == "-" & type =="deletion")
                        | (typ1 == "-" & typ2 == "-" & type =="insertion")))
                        {
                        #print("not in a family")
                        if(as.character(zygo)=="homozygous"){
                            countfre <- 2
                            if(as.character(zygo)=="homozygous"){
                                homozygo<- as.character(svfamid1)
                            }
                            else{
                                homozygo<- NULL
                            }
                        }
                        else if(zygo=="unknown"){
                            countfre <- 2
                        }
                        else { 
                            countfre <- 1
                        }
                        motherZygosity <- "-"
                        fatherZygosity <- "-"
                    } 
                    else{ 
                        countfre <- 0
                        motherZygosity <- "-"
                        fatherZygosity <- "-"
                    }
                        ###Unfiltered
                    if ((perc_ref_query >= perc_similarity 
                        & perc_query_ref >= perc_similarity) 
                        & identical(type, variantType2[nn]) 
                        & !(identical(svfamid1, svfamid))){
                        if(zygo=="homozygous"){
                            countfreunfilt <- 2
                        }
                        else if(zygo=="unknown"){
                            countfreunfilt <- 2
                        }
                        else{ 
                            countfreunfilt <- 1
                        }
                    } 
                    else{
                        countfreunfilt <- 0
                    }
                    
                    if(length(homozygo)>0){
                        homozygo <- length(unique(homozygo))
                    }
                    else{
                        homozygo=0
                    }
                  
                famno <- as.numeric(unname(hash::values(ha, keys = svfamid)))
                data1 <- data.frame(dat1[nn, ], 
                    Internal_Freq_Perc_Filtered = 
                    as.numeric(format(round((countfre/(2*(usamp - famno))) 
                    * 100,digits=3), scientific = FALSE)),
                    Internal_Freq_Perc_Unfiltered = 
                    as.numeric(format
                    (round((countfreunfilt/(2*(usamp - famno))) 
                    * 100,digits=3), scientific = FALSE)), 
                    Internal_Homozygotes=as.numeric(homozygo), 
                    MotherZygosity = as.character(motherZygosity), 
                    FatherZygosity = as.character(fatherZygosity),  
                    stringsAsFactors = FALSE)
                  
                datf <- rbind(datf, data1)
                } 
                else
                {
                    # dgv_match=FALSE
                    data1 <- data.frame(dat1[nn, ], 
                    Internal_Freq_Perc_Filtered = 0, 
                    Internal_Freq_Perc_Unfiltered = 0, 
                    Internal_Homozygotes= 0, 
                    MotherZygosity = "-", 
                    FatherZygosity = "-", 
                    stringsAsFactors = FALSE)
                    #### print(dim(data1)) print(names(data1)[56:58])
                    #### print(names(datf)[56:58])
                    #### print(identical((names(data1)[56]),(names(datf)[56])))
                    #### print(identical((names(data1)[57]),(names(datf)[57])))
                    #### print(identical((names(data1)[58]),(names(datf)[58])))
                    datf <- rbind(datf, data1)
                    # next;
                }
                
            } else if ((variantType2[nn] == "duplication" |
                    variantType2[nn] == "duplication_split" | 
                    variantType2[nn] == "duplication_inverted" |
                    variantType2[nn] == "insertion"))
                {   
                    dat2 <-dat[which((dat$RefStartPos >= rf_wb_ind[nn] 
                        & dat$RefEndPos <= re_wf_ind[nn])),]
                    size1 <- size_bn[nn]
                    ## Calculating Internal Frequency
                    if (nrow(dat2) > 1){ 
                    dat2$perc_ref_query <- as.numeric(dat2$Size)/size1
                    dat2$perc_query_ref <- size1/as.numeric(dat2$Size)
                    stt12 <- str_split(as.character(dat2$nanoID), pattern = "\\.")
                    famid <- c(); relnid <- c()
                    dat2$FamilyID <- sapply(stt12, function(x) x[1])
                    dat2$RelationID <- sapply(stt12, function(x) x[2])
                    dat2MomEqual_duplication <- dat2[which((
                            (dat2$RefStartPos ==rf[nn]) 
                            & (dat2$RefEndPos==re[nn]))  
                            & (dat2$perc_ref_query >= perc_similarity_parents 
                            & dat2$perc_query_ref >= perc_similarity_parents)
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 2)
                            & ((as.character(dat2$Type) == "duplication") |
                            (as.character(dat2$Type) == "duplication_split") |
                            (as.character(dat2$Type) == "duplication_inverted")
                        )),]
                    dat2DadEqual_duplication <- dat2[which((
                            (dat2$RefStartPos ==rf[nn]) 
                            & (dat2$RefEndPos==re[nn]))  
                            & (dat2$perc_ref_query >= perc_similarity_parents 
                            & dat2$perc_query_ref >= perc_similarity_parents)
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 
                            & dat2$RelationID == 3)
                            & ((as.character(dat2$Type) == "duplication") |
                            (as.character(dat2$Type) == "duplication_split") |
                            (as.character(dat2$Type) == "duplication_inverted")
                        )),]
                    dat2MomRange_duplication <- dat2[which(((
                            dat2$RefStartPos >= rf_wb_ind_parents[nn])
                            & (dat2$perc_ref_query >= perc_similarity_parents 
                            &  dat2$perc_query_ref >= perc_similarity_parents) 
                            & (dat2$RefEndPos <= re_wf_ind_parents[nn]))
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 2)
                            & ((as.character(dat2$Type) == "duplication") 
                            | (as.character(dat2$Type) == "duplication_split") 
                            | (as.character(dat2$Type) == "duplication_inverted")
                        )),]
                    dat2DadRange_duplication <- dat2[which(((
                            dat2$RefStartPos >= rf_wb_ind_parents[nn])
                            & (dat2$perc_ref_query >= perc_similarity_parents 
                            &  dat2$perc_query_ref >= perc_similarity_parents)                            
                            & (dat2$RefEndPos <= re_wf_ind_parents[nn]))
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 3)
                            & ((as.character(dat2$Type) == "duplication") 
                            | (as.character(dat2$Type) == "duplication_split") 
                            | (as.character(dat2$Type) == "duplication_inverted")
                        )),]
                    dat2MomEqual_insertion <- dat2[which(
                            ((dat2$RefStartPos ==rf[nn]) 
                            & (dat2$RefEndPos==re[nn])) 
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (dat2$perc_ref_query >= perc_similarity_parents 
                            & dat2$perc_query_ref >= perc_similarity_parents) 
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 2) 
                            & ((as.character(dat2$Type) == "insertion")
                        )),]
                    dat2DadEqual_insertion <- dat2[which(
                            ((dat2$RefStartPos ==rf[nn]) 
                            & (dat2$RefEndPos==re[nn])) 
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (dat2$perc_ref_query >= perc_similarity_parents 
                            & dat2$perc_query_ref >= perc_similarity_parents) 
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 3) 
                            & ((as.character(dat2$Type) == "insertion")
                        )),]
                    dat2MomRange_insertion <- dat2[which(((
                        dat2$RefStartPos >= rf_wb_ind_parents[nn]) 
                        & (dat2$RefEndPos <= re_wf_ind_parents[nn])) 
                        & (dat2$perc_ref_query >= perc_similarity_parents 
                        & dat2$perc_query_ref >= perc_similarity_parents) 
                        & (as.character(dat2$Type) == variantType2[nn])
                        & (as.character(dat2$FamilyID) == svfamid)
                        & (patID == 1 & dat2$RelationID == 2) 
                        & ((as.character(dat2$Type) == "insertion")
                        )),]
                    dat2DadRange_insertion <- dat2[which(((
                        dat2$RefStartPos >= rf_wb_ind_parents[nn]) 
                        & (dat2$RefEndPos <= re_wf_ind_parents[nn])) 
                        & (dat2$perc_ref_query >= perc_similarity_parents 
                        & dat2$perc_query_ref >= perc_similarity_parents) 
                        & (as.character(dat2$Type) == variantType2[nn])
                        & (as.character(dat2$FamilyID) == svfamid)
                        & (patID == 1 & dat2$RelationID == 3) 
                        & ((as.character(dat2$Type) == "insertion")
                        )),]
                    dat2FrequencyDuplication <- dat2[which(((
                            as.character(dat2$Type) == "duplication") |
                            (as.character(dat2$Type) == "duplication_split") |
                            (as.character(dat2$Type) == "duplication_inverted"))
                            & (dat2$perc_ref_query >= perc_similarity 
                            & dat2$perc_query_ref >= perc_similarity)
                            & (as.character(dat2$FamilyID) != svfamid)
                            &((dat2$Found_in_self_BSPQI_molecules == "yes" & 
                            dat2$Found_in_self_BSSSI_molecules == "yes") 
                            | (dat2$Found_in_self_BSPQI_molecules == "no" 
                            & dat2$Found_in_self_BSSSI_molecules == "yes") 
                            | (dat2$Found_in_self_BSPQI_molecules == "yes" 
                            & dat2$Found_in_self_BSSSI_molecules == "no") 
                            | (dat2$Found_in_self_BSPQI_molecules == "yes" 
                            & dat2$Found_in_self_BSSSI_molecules == "-") 
                            | (dat2$Found_in_self_BSPQI_molecules == "-" 
                            & dat2$Found_in_self_BSSSI_molecules == "yes")
                            | (dat2$Found_in_SE_self_molecules == "yes"))
                            & ((dat2$Type1 =="duplication" & 
                                dat2$Type2 =="duplication") | 
                                (dat2$Type1 =="duplication" 
                                & is.na(dat2$Type2)) |
                                (is.na(dat2$Type1) & dat2$Type2 =="duplication") 
                                | (dat2$Type1 == "duplication_split" 
                                & dat2$Type2 == "duplication_split") |
                                (dat2$Type1 == "duplication_split"
                                & is.na(dat2$Type2)) | 
                                (is.na(dat2$Type1)
                                & dat2$Type2 =="duplication_split")
                                | (dat2$Type1 == "duplication_inverted" 
                                & dat2$Type2 == "duplication_inverted") 
                                |(dat2$Type1 == "duplication_inverted" 
                                & is.na(dat2$Type2)) | 
                                (is.na(dat2$Type1) 
                                & dat2$Type2 =="duplication_inverted")
                                | (dat2$Type1 == "-" & dat2$Type2 == "-" 
                                & dat2$Type == "duplication_inverted")
                                | (dat2$Type1 == "-" & dat2$Type2 == "-" 
                                & dat2$Type == "duplication")
                                | (dat2$Type1 == "-" & dat2$Type2 == "-" 
                                & dat2$Type == "duplication_split"))
                            & ((dat2$Fail_BSPQI_assembly_chimeric_score == "pass" & 
                            dat2$Fail_BSSSI_assembly_chimeric_score == "pass") 
                            | (dat2$Fail_BSPQI_assembly_chimeric_score == "fail" 
                            & dat2$Fail_BSSSI_assembly_chimeric_score == "pass") 
                            | (dat2$Fail_BSPQI_assembly_chimeric_score == "pass" 
                            & dat2$Fail_BSSSI_assembly_chimeric_score == "fail") 
                            | (dat2$Fail_BSPQI_assembly_chimeric_score == "pass" 
                            & dat2$Fail_BSSSI_assembly_chimeric_score == "-") 
                            | (dat2$Fail_BSPQI_assembly_chimeric_score == "-" 
                            & dat2$Fail_BSSSI_assembly_chimeric_score == "pass")
                            |(dat2$Fail_assembly_chimeric_score_SE == "pass"))),]

                            
                   # dat2FrequencyDuplication <- subset(dat2,(((as.character(dat2$Type) == "duplication") |
                            
                            
                            
                            
                    dat2Insertion <- dat2[which((
                        dat2$perc_ref_query >= perc_similarity 
                        & dat2$perc_query_ref >= perc_similarity) 
                        & (dat2$Size >= limsize)
                        & (as.character(dat2$Type) == variantType2[nn])
                        & (as.character(dat2$FamilyID) != svfamid)
                        & (dat2$Confidence >= indelconf)
                        & ((dat2$Found_in_self_BSPQI_molecules == "yes" 
                        & dat2$Found_in_self_BSSSI_molecules == "yes") 
                        | (dat2$Found_in_self_BSPQI_molecules == "no" 
                        & dat2$Found_in_self_BSSSI_molecules == "yes") 
                        | (dat2$Found_in_self_BSPQI_molecules == "yes" 
                        & dat2$Found_in_self_BSSSI_molecules == "no") 
                        | (dat2$Found_in_self_BSPQI_molecules == "yes" 
                        & dat2$Found_in_self_BSSSI_molecules == "-") 
                        | (dat2$Found_in_self_BSPQI_molecules == "-" 
                        & dat2$Found_in_self_BSSSI_molecules == "yes")
                        | (dat2$Found_in_SE_self_molecules == "yes"))
                        & ((dat2$Type1 =="insertion" & dat2$Type2 =="insertion") 
                        | (dat2$Type1 =="insertion" & is.na(dat2$Type2)) 
                        | (is.na(dat2$Type1) & dat2$Type2 =="insertion") 
                        | (dat2$Type1 == "-" 
                        & dat2$Type2 == "-" & dat2$Type == "insertion")
                        | (dat2$Type == "insertion"))),]
                    dat2UnfilteredFrequency <- dat2[which(((
                        as.character(dat2$Type) == "duplication") |
                        (as.character(dat2$Type) == "duplication_split") |
                        (as.character(dat2$Type) == "duplication_inverted") |
                        (as.character(dat2$Type) == "insertion"))
                        & (dat2$perc_ref_query >= perc_similarity 
                        & dat2$perc_query_ref >= perc_similarity)
                        & (as.character(dat2$FamilyID) != svfamid)),]
                    if (nrow(dat2FrequencyDuplication) > 0 & 
                            nrow(dat2Insertion) > 0){
                            dat2Frequency <- rbind(
                                dat2FrequencyDuplication, dat2Insertion
                                )
                            }
                    else if(nrow(dat2FrequencyDuplication) > 0 & 
                            nrow(dat2Insertion) == 0){
                            dat2Frequency <- dat2FrequencyDuplication
                            }
                    else if(nrow(dat2FrequencyDuplication) == 0 & 
                            nrow(dat2Insertion) > 0){
                            dat2Frequency <- dat2Insertion
                            }
                    else{dat2Frequency <- c()}
                            
                            
                            
                            
                        ##Calculating filtered Frequency INDEL
                        ##Filtration
                 
                        ##Filtered
                    if (is.null(dat2Frequency)){
                            filtFreq  = 0
                            cntHomozygotes = 0
                    }    
                    else if (nrow(dat2Frequency) > 0){
                        
                        countfre1 <- 0
                        dat2Homozygotes <- data.frame(dat2Frequency 
                        %>%     mutate(Homozygo = .data$Zygosity=="homozygous") 
                        %>%     group_by(.data$nanoID) 
                        %>%     summarise (Homozygotes = sum(.data$Homozygo)))
                        cntHomozygotes <- sum(dat2Homozygotes$Homozygo)
                        dat2Homozygotes [,2] <- ifelse(
                                dat2Homozygotes[,2] > 0, 2, 0
                                )
                        dat2Heterozygotes <- data.frame(dat2Frequency 
                        %>%     mutate(Heterozygo = .data$Zygosity == "heterozygous") 
                        %>%     group_by(.data$nanoID) 
                        %>%     summarise (Heterozygotes = sum(.data$Heterozygo)))
                        dat2Heterozygotes [,2] <- ifelse(
                                    dat2Heterozygotes[,2] > 0, 1, 0
                                    )
                        dat2Unknown <- data.frame(dat2Frequency 
                        %>%     mutate(Unknown = .data$Zygosity == "unknown") 
                        %>%     group_by(.data$nanoID) 
                        %>%     summarise (Unknown = sum(.data$Unknown)))
                        dat2Unknown [,2] <- ifelse(
                                    dat2Unknown[,2] > 0, 2, 0
                                )
                        dat2filtFreq <- data.frame(
                                    NR = dat2Homozygotes[,1], 
                                    Homozygote = dat2Homozygotes[,2], 
                                    Heterozygotes = dat2Heterozygotes[,2], 
                                    Unknown = dat2Unknown[,2])
                        row.names(dat2filtFreq) <- as.character(
                                    dat2Homozygotes[,1]
                                    )
                        dat2filtFreq$RowSum <- ifelse((
                                    dat2filtFreq$Heterozygotes ==1 
                                    & (dat2filtFreq$Homozygote == 0 
                                    & dat2filtFreq$Unknown == 0)), 1, 2)
                        filtFreq <- sum(dat2filtFreq$RowSum)
                        } else{
                            filtFreq  = 0
                            cntHomozygotes = 0
                        }
                        
                    
                    ###Unfiltered
                    if (is.null(dat2UnfilteredFrequency)){
                            filtFreq  = 0
                            cntHomozygotes = 0
                    }    
                    else if (nrow(dat2UnfilteredFrequency) > 0){
                        dat2Homozygotes <- data.frame(dat2UnfilteredFrequency
                        %>%     mutate(Homozygo=.data$Zygosity=="homozygous") 
                        %>%     group_by(.data$nanoID) 
                        %>%     summarise (Homozygotes = sum(.data$Homozygo)))
                        #cntHomozygotes <- sum(dat2Homozygotes$Homozygotes)
                        dat2Homozygotes [,2] <- ifelse(
                                    dat2Homozygotes[,2] > 0, 2, 0
                                    )
                        dat2Heterozygotes <- data.frame(
                                    dat2UnfilteredFrequency 
                                    %>%     mutate(
                                    Heterozygo = .data$Zygosity == "heterozygous"
                                    ) 
                                    %>%     group_by(.data$nanoID) 
                                    %>%     summarise (Heterozygotes = sum(.data$Heterozygo))
                                    )
                        dat2Heterozygotes [,2] <- ifelse(
                                    dat2Heterozygotes[,2] > 0, 1, 0
                                    )
                        dat2Unknown <- data.frame(
                                dat2UnfilteredFrequency 
                                %>%     mutate(Unknown = .data$Zygosity == "unknown") 
                                %>%     group_by(.data$nanoID) 
                                %>%     summarise (Unknown = sum(.data$Unknown)))
                        dat2Unknown [,2] <- ifelse(
                                        dat2Unknown[, 2] > 0, 2, 0
                                        )
                        dat2unfiltFreq <- data.frame(
                                    Homozygote = dat2Homozygotes[,2],
                                    Heterozygotes = dat2Heterozygotes[,2], 
                                    Unknown = dat2Unknown[,2]
                                    )
                        row.names(dat2unfiltFreq) <- as.character(
                                    dat2Homozygotes[,1]
                                    )
                        dat2unfiltFreq$RowSum <- ifelse(
                                        (dat2unfiltFreq$Heterozygotes ==1 
                                        & (dat2unfiltFreq$Homozygote == 0 
                                        & dat2unfiltFreq$Unknown == 0)), 1, 2)
                        UnfilteredFrequency  = sum(dat2unfiltFreq$RowSum)
                        } else{
                            UnfilteredFrequency = 0
                        }
                    dat2DadEqual <- rbind(dat2DadEqual_duplication, dat2DadEqual_insertion)
                    dat2MomEqual <- rbind(dat2MomEqual_duplication, dat2MomEqual_insertion)
                    dat2DadRange <- rbind(dat2DadRange_duplication, dat2DadRange_insertion)
                    dat2MomRange <- rbind(dat2MomRange_duplication, dat2MomRange_insertion)
                 
                    ##Calculating filtered Frequency INDEL
                    ##Zygosity Parent
                        if(length(dat2DadEqual$Zygosity) > 0){
                            if(length(as.character(unique
                            (dat2DadEqual$Zygosity))) == 1){
                                fatherZygosity<-as.character(
                                unique(dat2DadEqual$Zygosity)
                                )
                            }else {
                                fatherZygosity <- paste(
                                as.character(dat2DadEqual$Zygosity), 
                                collapse = ","
                                )
                            }
                        } else if (length(dat2DadRange$Zygosity) > 0){
                        fatherzygosity <- as.character(dat2DadRange$Zygosity)
                        fatherZygosity1 <- gsub("-", NA, fatherzygosity)
                        fatherZygosity1 <- as.character(
                                na.omit(fatherZygosity1)
                                )
                        if(length(fatherZygosity1) == 1){
                            fatherZygosity<-as.character(
                            unique(fatherZygosity1)
                            )
                        } 
                        else {
                            fatherZygosity <- paste(
                                as.character(fatherZygosity1), 
                                collapse = ","
                                )
                        }
                        } else {
                            fatherZygosity <- "-"
                            }
                       
                        ###Mother Zygosity
                        if(length(dat2MomEqual$Zygosity) > 0){
                            if(length(as.character(unique
                            (dat2MomEqual$Zygosity))) == 1){
                                motherZygosity<-as.character(
                                    unique(dat2MomEqual$Zygosity)
                                    )
                            }else {
                                motherZygosity <- paste(
                                as.character(dat2MomEqual$Zygosity), 
                                collapse = ","
                                )
                            }
                        } else if (length(dat2MomRange$Zygosity) > 0){
                        motherZygosity <- as.character(dat2MomRange$Zygosity)
                        motherZygosity1 <- gsub("-", NA, motherZygosity)
                        motherZygosity1 <- as.character(
                                na.omit(motherZygosity1)
                                )
                        if(length(motherZygosity1) == 1){
                            motherZygosity<-as.character(
                            unique(motherZygosity1)
                            )
                        } 
                        else {
                            motherZygosity <- paste(
                                as.character(motherZygosity1), 
                                collapse = ","
                                )
                        }
                        } else {
                            motherZygosity <- "-"
                            }
                       
                  
                  
                   
                        famno <- unname(hash::values(ha2, keys = sampID))
                        fampas <- paste("^",as.character(
                                famindexfile$Tag),"$",sep=""
                                )
                        famnopas <- paste("^",as.character(famno),"$",sep="")
                        famnumb <- length(grep(famnopas, fampas, fixed=TRUE))
                        data1 <- data.frame(dat1[nn, ], 
                            Internal_Freq_Perc_Filtered = 
                            as.numeric(format(round(
                            (filtFreq/(2*(usamp - famnumb))) * 100,digits=3)
                            , scientific = FALSE)),
                            Internal_Freq_Perc_Unfiltered = 
                            as.numeric
                            (format(round((UnfilteredFrequency/
                            (2*(usamp - famnumb))) * 100,digits=3), 
                            scientific = FALSE)),
                            Internal_Homozygotes=as.numeric(cntHomozygotes), 
                            MotherZygosity = as.character(motherZygosity), 
                            FatherZygosity = as.character(fatherZygosity),  
                            stringsAsFactors = FALSE)
                   
                    datf <- rbind(datf, data1)
                    }
                    else if (nrow(dat2) == 1){ 
                        # dgv_match=TRUE Calculating percentage similarity
                        countfre <- 0;countfreunfilt<-0
                        svv <- dat2$nanoID
                        #size_internal <- dat2$Size
                        conf <- dat2$Confidence
                        #Found_in_SE_self_molecules <- dat2$Found_in_SE_self_molecules
                        #dat2$Fail_assembly_chimeric_score_SE_DLE <- dat2$dat2$Fail_assembly_chimeric_score_SE_DLE
                        BSPQI_status_DB <- 
                        as.character(dat2$Found_in_self_BSPQI_molecules)
                        BSSSI_status_DB <- 
                        as.character(dat2$Found_in_self_BSSSI_molecules)
                        BSPQI_chimeric_score_DB <-  as.character(
                                dat2$Fail_BSPQI_assembly_chimeric_score
                            )
                        BSSSI_chimeric_score_DB <- as.character(
                                dat2$Fail_BSSSI_assembly_chimeric_score
                                )
                        Found_in_SE_self_molecules <- dat2$Found_in_SE_self_molecules
                        Fail_assembly_chimeric_score_SE <- dat2$Fail_assembly_chimeric_score_SE 
                        perc_ref_query <- as.numeric(dat2$Size)/size1
                        perc_query_ref <- size1/as.numeric(dat2$Size)
                        #svv <- strsplit(as.character(svfam1), split = "_")
                        zygo <- as.character(dat2$Zygosity)
                        stt <- strsplit(as.character(svv), split = "[.]")
                        patID1 <- stt[[1]][2]
                        homozygo<-c()
                        svfamid1 <- stt[[1]][1]
                        motherZygosity <- ""
                        fatherZygosity <- ""
                        type <- as.character(dat2$Type)
                        typ1 <- as.character(dat2$Type1)
                        typ2 <- as.character(dat2$Type2)
                  #print(type)
                        if (((dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                        & (dat2$RefEndPos <= re_fb_int_parents[nn]))
                        & ((identical(type, "duplication") 
                        | identical(type, "duplication_split")| 
                        identical(type, "duplication_inverted"))) 
                        & (perc_ref_query >= perc_similarity_parents 
                        & perc_query_ref >= perc_similarity_parents)                        
                        & (identical(svfamid1, svfamid)) )
                        {
                            'print(type)
                            print(svfamid1)
                            print(svfamid)
                            print(BSPQI_status_DB)
                            print(BSSSI_status_DB)
                            print(paste(ii,":",nn))'
                            # Family Extra column zygosity
                            if (patID == 1 & patID1 == 2){
                                motherZygosity <- as.character(zygo)
                                fatherZygosity <- "-"
                            } 
                            else if (patID == 1 & patID1 == 3){
                                motherZygosity <- "-"
                                fatherZygosity <- as.character(zygo)
                            } 
                            else if (patID == patID1){
                                motherZygosity <- "-"
                                fatherZygosity <- "-"
                            } 
                            else{
                                motherZygosity <- "-"
                                fatherZygosity <- "-"
                            }
                        } 
                        else if (((identical(type, "duplication") 
                            | identical(type, "duplication_split")
                            | identical(type, "duplication_inverted"))) 
                            & (perc_ref_query >= perc_similarity 
                            & perc_query_ref >= perc_similarity)
                            & !(identical(svfamid1, svfamid)) 
                            & ((BSPQI_status_DB == "yes" 
                            & BSSSI_status_DB == "yes") 
                            | (BSPQI_status_DB == "no" 
                            & BSSSI_status_DB == "yes") 
                            | (BSPQI_status_DB == "yes" 
                            & BSSSI_status_DB == "no") 
                            | (BSPQI_status_DB == "yes" 
                            & BSSSI_status_DB == "-") 
                            | (BSPQI_status_DB == "-" 
                            & BSSSI_status_DB == "yes")
                            | (Found_in_SE_self_molecules == "yes")) 
                            & ((BSPQI_chimeric_score_DB == "pass" 
                            & BSSSI_chimeric_score_DB == "pass") 
                            | (BSPQI_chimeric_score_DB == "fail" 
                            & BSSSI_chimeric_score_DB == "pass") 
                            | (BSPQI_chimeric_score_DB == "pass" 
                            & BSSSI_chimeric_score_DB == "fail") 
                            | (BSPQI_chimeric_score_DB == "pass" 
                            & BSSSI_chimeric_score_DB == "-") 
                            | (BSPQI_chimeric_score_DB == "-" 
                            & BSSSI_chimeric_score_DB == "pass")
                            | (Fail_assembly_chimeric_score_SE == "pass")) 
                            & ((typ1=="duplication" & typ2=="duplication") 
                            | (typ1=="duplication" & is.na(typ2)) 
                            | (is.na(typ1) & typ2=="duplication") 
                            | (typ1=="duplication_split" 
                            & typ2=="duplication_split") 
                            | (typ1=="duplication_split" & is.na(typ2)) 
                            | (is.na(typ1) & typ2=="duplication_split") 
                            | (typ1=="duplication_inverted" 
                            & typ2=="duplication_inverted") 
                            | (typ1=="duplication_inverted" & is.na(typ2)) 
                            | (is.na(typ1) & typ2=="duplication_inverted")
                            | (typ1=="-" & typ2=="-" & type == "duplication")
                            | (typ1=="-" & typ2=="-" 
                            & type == "duplication_inverted")
                            | (typ1=="-" & typ2=="-" 
                            & type == "duplication_split"))){
                            if(zygo=="homozygous"){
                                countfre <- 2
                            }
                            else if(zygo=="unknown"){
                                countfre <- 2
                            }
                            else{ 
                                countfre <- 1
                            }
                            if(as.character(zygo)=="homozygous"){
                                homozygo <- as.character(svfamid1)
                            }
                            else{
                                homozygo<- NULL
                            }
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                            'motherZygosity <- "-"
                            fatherZygosity <- "-"'
                        } 
                        else if (((identical(type, "insertion"))) & 
                        (identical(svfamid1, svfamid)) & 
                        ((dat2$RefStartPos >= rf_wb_int_parents[nn]) & 
                        (dat2$RefEndPos <= re_fb_int_parents[nn])) 
                        & (perc_ref_query >= perc_similarity_parents 
                        & perc_query_ref >= perc_similarity_parents)){
                            # Family Extra column zygosity
                            if (patID == 1 & patID1 == 2){
                                motherZygosity <- as.character(zygo)
                                fatherZygosity <- "-"
                            }
                            else if (patID == 1 & patID1 == 3){
                                motherZygosity <- "-"
                                fatherZygosity <- as.character(zygo)
                            } 
                            else if (patID == patID1){
                                motherZygosity <- "-"
                                fatherZygosity <- "-"
                            }
                            else {
                                motherZygosity <- "-"
                                fatherZygosity <- "-"
                            }
                        } 
                        else if (((identical(type, "insertion"))) & 
                        !(identical(svfamid1, svfamid)) 
                        & (perc_ref_query >= perc_similarity 
                        & perc_query_ref >= perc_similarity) 
                        & ((BSPQI_status_DB == "yes" &
                        BSSSI_status_DB == "yes") |
                        (BSPQI_status_DB == "no" & 
                        BSSSI_status_DB == "yes") |
                        (BSPQI_status_DB == "yes" & 
                        BSSSI_status_DB == "no") |
                        (BSPQI_status_DB == "yes" & 
                        BSSSI_status_DB == "-") |
                        (BSPQI_status_DB == "-" & 
                        BSSSI_status_DB == "yes")
                        | (Found_in_SE_self_molecules == "yes")) & 
                        ((size_internal>=limsize)) & 
                        (conf > indelconf) & 
                        ((typ1=="insertion" & typ2=="insertion") |
                        (typ1=="insertion" & is.na(typ2)) | 
                        (is.na(typ1) & typ2=="insertion")
                        | (typ1=="-" & typ2=="-" & type == "insertion"))){
                            if(zygo=="homozygous"){
                                countfre <- 2
                            }
                            else if(zygo=="unknown"){
                                countfre <- 2
                            }
                            else{ 
                                countfre <- 1
                            }
                            if(as.character(zygo)=="homozygous"){
                                homozygo <- as.character(svfamid1)
                            }
                            else{
                                homozygo <- NULL
                            }
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                        } 
                        else {
                            countfre <- 0
                    
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                   
                        }
                        if (((identical(type, "duplication") |
                            identical(type, "duplication_split")| 
                            identical(type, "duplication_inverted")|
                            identical(type, "insertion"))) 
                            & (perc_ref_query >= perc_similarity 
                            & perc_query_ref >= perc_similarity)
                            & !(identical(svfamid1, svfamid))){
                            if(zygo=="homozygous"){
                                countfreunfilt <- 2
                            }
                            else if(zygo=="unknown"){
                                countfreunfilt <- 2
                            }
                            else{ 
                                countfreunfilt <- 1
                            }
                    
                        }
                        else{
                            countfreunfilt <- 0
                        }
                    
                    if(length(homozygo)>0){
                        homozygo <- length(homozygo)
                    }
                    else{
                        homozygo= 0
                    }
                  
                    famno <- as.numeric(unname(hash::values(ha, keys = svfamid)
                        ))
                    data1 <- data.frame(dat1[nn, ], 
                    Internal_Freq_Perc_Filtered = 
                    as.numeric(format(round((countfre/(2*(usamp - famno))) 
                    * 100,digits=3), scientific = FALSE)),
                    Internal_Freq_Perc_Unfiltered = as.numeric(format(round((
                    countfreunfilt/(2*(usamp - famno))) * 100,digits=3), scientific = FALSE)),
                    Internal_Homozygotes=as.numeric(homozygo), 
                    MotherZygosity = as.character(motherZygosity), 
                    FatherZygosity = as.character(fatherZygosity), 
                    stringsAsFactors = FALSE)
                    
                    datf <- rbind(datf, data1)
                   } 
                   else
                   {
                    # dgv_match=FALSE
                    data1 <- data.frame(dat1[nn, ], 
                    Internal_Freq_Perc_Filtered = 0, 
                    Internal_Freq_Perc_Unfiltered = 0,
                    Internal_Homozygotes= 0, 
                    MotherZygosity = "-", 
                    FatherZygosity = "-", 
                    stringsAsFactors = FALSE)
                  #### print(dim(data1)) print(names(data1)[56:58])
                  #### print(names(datf)[56:58])
                  #### print(identical((names(data1)[56]),(names(datf)[56])))
                  #### print(identical((names(data1)[57]),(names(datf)[57])))
                  #### print(identical((names(data1)[58]),(names(datf)[58])))
                     datf <- rbind(datf, data1)
                  # next;
                }
                
            }
            else if ((length(grep("inversion", variantType2[nn])) >= 1) | 
            (length(grep("translocation", variantType2[nn])) >= 1)) {
                if((length(grep("translocation", variantType2[nn])) >= 1)){
                    dat2 <- dat[which(((dat$RefStartPos <= rf[nn] & 
                        dat$RefStartPos >= rf_wb_ind[nn]) | 
                        (dat$RefStartPos >= rf[nn] & dat$RefStartPos <= 
                        rf_fb_ind[nn])) & ((dat$RefEndPos >= re[nn] & 
                        dat$RefEndPos <= re_wf_ind[nn]) |
                        (dat$RefEndPos <= re[nn] & dat$RefEndPos >= re_wb_ind[nn]))
                        ), ]
                    size1 <- size_bn[nn]
                    dat2$perc_ref_query <- rep(0, nrow(dat2))
                    dat2$perc_query_ref <- rep(0, nrow(dat2))
                }else {
                    dat2 <-dat[which((dat$RefStartPos >= rf_wb_ind[nn] 
                        & dat$RefEndPos <= re_wf_ind[nn])),]
                    size1 <- size_bn[nn]
                    ## Calculating Internal Frequency
                    dat2$perc_ref_query <- as.numeric(dat2$Size)/size1
                    dat2$perc_query_ref <- size1/as.numeric(dat2$Size)
                }    
                 
                
                
                ## Writing if the dgv_match is TRUE or not
                
                if (nrow(dat2) > 1){
                    #dat2$perc <- as.numeric(dat2$Size)/size1
                    stt12 <- str_split(as.character(dat2$nanoID), pattern = "\\.")
                    famid <- c(); relnid <- c()
                    dat2$FamilyID <- sapply(stt12, function(x) x[1])
                    dat2$RelationID <- sapply(stt12, function(x) x[2])
                    if((length(grep("inversion", variantType2[nn])) >= 1)){
                        dat2MomEqual <- dat2[which(((dat2$RefStartPos ==rf[nn]) 
                                & (dat2$RefEndPos==re[nn])) 
                                & (dat2$perc_ref_query >= perc_similarity_parents 
                                & dat2$perc_query_ref >= perc_similarity_parents)
                                & (dat2$RefcontigID2 == chromo2[nn]) 
                                & (as.character(dat2$Type) == variantType2[nn])
                                & (as.character(dat2$FamilyID) == svfamid)
                                & (patID == 1 & dat2$RelationID == 2)),]
                        dat2DadEqual <- dat2[which(((dat2$RefStartPos ==rf[nn]) 
                                & (dat2$RefEndPos==re[nn])) 
                                & (dat2$perc_ref_query >= perc_similarity_parents 
                                & dat2$perc_query_ref >= perc_similarity_parents)
                                & (dat2$RefcontigID2 == chromo2[nn]) 
                                & (as.character(dat2$Type) == variantType2[nn])
                                & (as.character(dat2$FamilyID) == svfamid)
                                & (patID == 1 & dat2$RelationID == 3)),]
                        dat2MomRange <- dat2[which(((
                            dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                            & (dat2$RefEndPos <= re_fb_int_parents[nn]))  
                            & (dat2$RefcontigID2 == chromo2[nn]) 
                            & (dat2$perc_ref_query >= perc_similarity_parents 
                            & dat2$perc_query_ref >= perc_similarity_parents)
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 2)),]
                            
                        dat2DadRange <- dat2[which(((
                            dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                            & (dat2$RefEndPos <= re_fb_int_parents[nn]))  
                            & (dat2$RefcontigID2 == chromo2[nn]) 
                            & (dat2$perc_ref_query >= perc_similarity_parents 
                            & dat2$perc_query_ref >= perc_similarity_parents)
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 3)),]
                        dat2UnfilteredFrequency <-  dat2[which((
                            (dat2$RefcontigID2 == chromo2[nn]) 
                            & (dat2$perc_ref_query >= perc_similarity 
                            & dat2$perc_query_ref >= perc_similarity)
                            & ((as.character(dat2$Type) == "inversion")
                            & (as.character(dat2$FamilyID) != svfamid)))),]
                          
                    }else{
                        dat2MomEqual <- dat2[which(((dat2$RefStartPos ==rf[nn]) 
                                & (dat2$RefEndPos==re[nn])) 
                                & (dat2$RefcontigID2 == chromo2[nn]) 
                                & (as.character(dat2$Type) == variantType2[nn])
                                & (as.character(dat2$FamilyID) == svfamid)
                                & (patID == 1 & dat2$RelationID == 2)),]
                        dat2DadEqual <- dat2[which(((dat2$RefStartPos ==rf[nn]) 
                                & (dat2$RefEndPos==re[nn])) 
                                & (dat2$RefcontigID2 == chromo2[nn]) 
                                & (as.character(dat2$Type) == variantType2[nn])
                                & (as.character(dat2$FamilyID) == svfamid)
                                & (patID == 1 & dat2$RelationID == 3)),]
                        dat2MomRange <- dat2[which(((
                            dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                            & (dat2$RefEndPos <= re_fb_int_parents[nn]))  
                            & (dat2$RefcontigID2 == chromo2[nn]) 
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 2)),]
                            
                        dat2DadRange <- dat2[which(((
                            dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                            & (dat2$RefEndPos <= re_fb_int_parents[nn]))  
                            & (dat2$RefcontigID2 == chromo2[nn]) 
                            & (as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) == svfamid)
                            & (patID == 1 & dat2$RelationID == 3)),]
                        dat2UnfilteredFrequency <-  dat2[which((
                            (dat2$RefcontigID2 == chromo2[nn]) 
                            & ((as.character(dat2$Type) == variantType2[nn])
                            & (as.character(dat2$FamilyID) != svfamid)))),]
                    }
                    dat2Frequencyinvtrans <- dat2[which(((
                        as.character(dat2$Type) == "inversion" &
                        as.numeric(dat2$Confidence) >= invconf 
                        & (dat2$perc_ref_query >= perc_similarity 
                        & dat2$perc_query_ref >= perc_similarity)
                        & ((dat2$Type1 =="inversion" & dat2$Type2 =="inversion") 
                        | (dat2$Type1 =="inversion" & is.na(dat2$Type2)) 
                        | (is.na(dat2$Type1) & dat2$Type2 =="inversion") 
                        | (dat2$Type1 == "-" 
                        & dat2$Type2 == "-" & dat2$Type == "inversion")))|
                        ((as.character(dat2$Type) == "translocation_intrachr"
                        | as.character(dat2$Type) == "translocation_interchr"
                        | as.character(dat2$Type) == "translocation")
                        & (as.numeric(dat2$Confidence) >= transconf)
                        & ((dat2$Type1 =="translocation" & 
                        dat2$Type2 =="translocation") | 
                        (dat2$Type1 =="translocation" 
                        & is.na(dat2$Type2)) |
                        (is.na(dat2$Type1) & dat2$Type2 =="translocation") 
                        | (dat2$Type1 == "translocation_intrachr" 
                        & dat2$Type2 == "translocation_intrachr") |
                        (dat2$Type1 == "translocation_intrachr"
                        & is.na(dat2$Type2)) | 
                        (is.na(dat2$Type1)
                        & dat2$Type2 =="translocation_intrachr")
                        | (dat2$Type1 == "translocation_interchr" 
                        & dat2$Type2 == "translocation_interchr") 
                        |(dat2$Type1 == "translocation_interchr" 
                        & is.na(dat2$Type2)) | 
                        (is.na(dat2$Type1) 
                        & dat2$Type2 =="translocation_interchr")
                        | (dat2$Type1 == "-" & dat2$Type2 == "-" 
                        & dat2$Type == "translocation_interchr")
                        | (dat2$Type1 == "-" & dat2$Type2 == "-" 
                        & dat2$Type == "translocation")
                        | (dat2$Type1 == "-" & dat2$Type2 == "-" 
                        & dat2$Type == "translocation_intrachr"))))
                        & (as.character(dat2$FamilyID) != svfamid)
                        & (dat2$RefcontigID2 == chromo2[nn]) 
                        &((dat2$Found_in_self_BSPQI_molecules == "yes" & 
                        dat2$Found_in_self_BSSSI_molecules == "yes") 
                        | (dat2$Found_in_self_BSPQI_molecules == "no" 
                        & dat2$Found_in_self_BSSSI_molecules == "yes") 
                        | (dat2$Found_in_self_BSPQI_molecules == "yes" 
                        & dat2$Found_in_self_BSSSI_molecules == "no") 
                        | (dat2$Found_in_self_BSPQI_molecules == "yes" 
                        & dat2$Found_in_self_BSSSI_molecules == "-") 
                        | (dat2$Found_in_self_BSPQI_molecules == "-" 
                        & dat2$Found_in_self_BSSSI_molecules == "yes")
                        | (dat2$Found_in_SE_self_molecules == "yes"))
                        & ((dat2$Fail_BSPQI_assembly_chimeric_score == "pass" 
                        & dat2$Fail_BSSSI_assembly_chimeric_score == "pass") 
                        | (dat2$Fail_BSPQI_assembly_chimeric_score == "fail" 
                        & dat2$Fail_BSSSI_assembly_chimeric_score == "pass") 
                        | (dat2$Fail_BSPQI_assembly_chimeric_score == "pass" 
                        & dat2$Fail_BSSSI_assembly_chimeric_score == "fail") 
                        | (dat2$Fail_BSPQI_assembly_chimeric_score == "pass" 
                        & dat2$Fail_BSSSI_assembly_chimeric_score == "-") 
                        | (dat2$Fail_BSPQI_assembly_chimeric_score == "-" 
                        & dat2$Fail_BSSSI_assembly_chimeric_score == "pass")
                        | (dat2$Fail_assembly_chimeric_score_SE == "pass"))),]
                    
                        
                                            
                    dat2Frequency <- dat2Frequencyinvtrans
                  ##Filtered
                    if (is.null(dat2Frequency)){
                            filtFreq  = 0
                            cntHomozygotes = 0
                    }
                    else if (nrow(dat2Frequency) > 0){
                        #print(0)
                        countfre1 <- 0
                        dat2Homozygotes <- data.frame(dat2Frequency 
                        %>% mutate(Homozygo = .data$Zygosity=="homozygous") 
                        %>% group_by(.data$nanoID) 
                        %>% summarise (Homozygotes = sum(.data$Homozygo)))
                        cntHomozygotes <- sum(dat2Homozygotes$Homozygo)
                        dat2Homozygotes [,2] <- ifelse(
                                    dat2Homozygotes[,2] > 0, 2, 0
                                    )
                        dat2Heterozygotes <- data.frame(dat2Frequency 
                        %>% mutate(Heterozygo = .data$Zygosity == "heterozygous") 
                        %>% group_by(.data$nanoID) 
                        %>% summarise (Heterozygotes = sum(.data$Heterozygo)))
                        dat2Heterozygotes [,2] <- ifelse(
                                    dat2Heterozygotes[,2] > 0, 1, 0
                                    )
                        dat2Unknown <- data.frame(dat2Frequency 
                        %>% mutate(Unknown = .data$Zygosity == "unknown") 
                        %>% group_by(.data$nanoID) 
                        %>% summarise (Unknown = sum(.data$Unknown)))
                        dat2Unknown [,2] <- ifelse(
                                    dat2Unknown[,2] > 0, 2, 0
                                    )
                        dat2filtFreq <- data.frame(
                                    NR = dat2Homozygotes[,1], 
                                    Homozygote = dat2Homozygotes[,2],
                                    Heterozygotes = dat2Heterozygotes[,2], 
                                    Unknown = dat2Unknown[,2]
                                    )
                        row.names(dat2filtFreq) <- as.character(
                                        dat2Homozygotes[,1]
                                        )
                        dat2filtFreq$RowSum <- ifelse((
                                        dat2filtFreq$Heterozygotes ==1 
                                        & (dat2filtFreq$Homozygote == 0 
                                        & dat2filtFreq$Unknown == 0)), 1, 2)
                        filtFreq <- sum(dat2filtFreq$RowSum)
                        } else{
                            filtFreq  = 0
                            cntHomozygotes = 0
                        }
                        
                    
                    ###Unfiltered
                    
                    if (is.null(dat2UnfilteredFrequency)){
                            filtFreq  = 0
                            cntHomozygotes = 0
                    }
                    else if (nrow(dat2UnfilteredFrequency) > 0){
                        dat2Homozygotes <- data.frame(dat2UnfilteredFrequency 
                        %>% mutate(Homozygo=.data$Zygosity=="homozygous") 
                        %>% group_by(.data$nanoID) 
                        %>% summarise (Homozygotes = sum(.data$Homozygo)))
                        #cntHomozygotes <- sum(dat2Homozygotes$Homozygotes)
                        dat2Homozygotes [,2] <- ifelse(
                                        dat2Homozygotes[,2] > 0, 2, 0
                                        )
                        dat2Heterozygotes <- data.frame(
                                        dat2UnfilteredFrequency 
                                        %>% mutate(
                                        Heterozygo = .data$Zygosity == "heterozygous"
                                        ) 
                                        %>% group_by(.data$nanoID) 
                                        %>% summarise (Heterozygotes = sum(.data$Heterozygo))
                                            )
                        dat2Heterozygotes [,2] <- ifelse(
                                        dat2Heterozygotes[,2] > 0, 1, 0
                                        )
                        dat2Unknown <- data.frame(
                                    dat2UnfilteredFrequency 
                                    %>% mutate(Unknown = .data$Zygosity == "unknown")
                                    %>% group_by(.data$nanoID) 
                                    %>% summarise (Unknown = sum(.data$Unknown))
                                    )
                        dat2Unknown [,2] <- ifelse(
                                   dat2Unknown[, 2] > 0, 2, 0
                                   )
                        dat2unfiltFreq <- data.frame(
                                    Homozygote = dat2Homozygotes[,2],
                                    Heterozygotes = dat2Heterozygotes[,2],
                                    Unknown = dat2Unknown[,2])
                        row.names(dat2unfiltFreq) <- as.character(dat2Homozygotes[,1])
                        dat2unfiltFreq$RowSum <- ifelse((
                                dat2unfiltFreq$Heterozygotes ==1 
                                & (dat2unfiltFreq$Homozygote == 0 
                                & dat2unfiltFreq$Unknown == 0)), 1, 2)
                        UnfilteredFrequency  = sum(dat2unfiltFreq$RowSum)
                        } else{
                            UnfilteredFrequency = 0
                        }
                        
                 
                    ##Calculating filtered Frequency INDEL
                    ##Zygosity Parent
                        if(length(dat2DadEqual$Zygosity) > 0){
                            if(length(as.character(unique
                            (dat2DadEqual$Zygosity))) == 1){
                                fatherZygosity<-as.character(
                                unique(dat2DadEqual$Zygosity)
                                )
                            }else {
                                fatherZygosity <- paste(
                                as.character(dat2DadEqual$Zygosity), 
                                collapse = ","
                                )
                            }
                        } else if (length(dat2DadRange$Zygosity) > 0){
                        fatherzygosity <- as.character(dat2DadRange$Zygosity)
                        fatherZygosity1 <- gsub("-", NA, fatherzygosity)
                        fatherZygosity1 <- as.character(
                                na.omit(fatherZygosity1)
                                )
                        if(length(fatherZygosity1) == 1){
                            fatherZygosity<-as.character(
                            unique(fatherZygosity1)
                            )
                        } 
                        else {
                            fatherZygosity <- paste(
                                as.character(fatherZygosity1), 
                                collapse = ","
                                )
                        }
                        } else {
                            fatherZygosity <- "-"
                            }
                       
                        ###Mother Zygosity
                        if(length(dat2MomEqual$Zygosity) > 0){
                            if(length(as.character(unique
                            (dat2MomEqual$Zygosity))) == 1){
                                motherZygosity<-as.character(unique(
                                    dat2MomEqual$Zygosity)
                                    )
                            }else {
                                motherZygosity <- paste(
                                as.character(dat2MomEqual$Zygosity), 
                                collapse = ","
                                )
                            }
                        } else if (length(dat2MomRange$Zygosity) > 0){
                        motherZygosity <- as.character(dat2MomRange$Zygosity)
                        motherZygosity1 <- gsub("-", NA, motherZygosity)
                        motherZygosity1 <- as.character(
                                na.omit(motherZygosity1)
                                )
                        if(length(motherZygosity1) == 1){
                            motherZygosity<-as.character(
                            unique(motherZygosity1)
                            )
                        } 
                        else {
                            motherZygosity <- paste(
                                as.character(motherZygosity1), 
                                collapse = ","
                                )
                        }
                        } else {
                            motherZygosity <- "-"
                            }
                       
                  
                  
                   
                        famno <- unname(hash::values(ha2, keys = sampID))
                        fampas <- paste("^",as.character(famindexfile$Tag),"$", 
                                sep="")
                        famnopas <- paste("^",as.character(famno),"$",sep="")
                        famnumb <- length(grep(famnopas, fampas, fixed=TRUE))
                        data1 <- data.frame(dat1[nn, ], 
                            Internal_Freq_Perc_Filtered = 
                            as.numeric(format(round(
                            (filtFreq/(2*(usamp - famnumb))) * 100,digits=3) , scientific = FALSE)),
                            Internal_Freq_Perc_Unfiltered = as.numeric(format(round((
                            UnfilteredFrequency/(2*(usamp - famnumb))) * 100,digits=3), 
                            scientific = FALSE)),
                            Internal_Homozygotes=as.numeric(cntHomozygotes), 
                            MotherZygosity = as.character(motherZygosity), 
                            FatherZygosity = as.character(fatherZygosity), 
                            stringsAsFactors = FALSE)
                        datf <- rbind(datf, data1)
                } 
                else if (nrow(dat2) == 1)
                {
                    ## dgv_match=TRUE Calculating percentage similarity
                    countfre<-0;countfreunfilt<-0
                    chrom2<-dat2$RefcontigID2
                    svv <- dat2$nanoID
                    zygo <- as.character(dat2$Zygosity)
                    stt <- strsplit(as.character(svv), split = "[.]")
                    type <- as.character(dat2$Type)
                    typ1 <- as.character(dat2$Type1)
                    typ2 <- as.character(dat2$Type2)
                    patID1 <- stt[[1]][2]
                    svfamid1 <- stt[[1]][1]
                    conf <- dat2$Confidence
                    perc_ref_query <- dat2$perc_ref_query
                    perc_query_ref <- dat2$perc_query_ref
                    
                    homozygo<-c()
                    #dat2$Fail_assembly_chimeric_score_SE_DLE <- dat2$dat2$Fail_assembly_chimeric_score_SE_DLE
                    Found_in_SE_self_molecules <- dat2$Found_in_SE_self_molecules
                    Fail_assembly_chimeric_score_SE <- dat2$Fail_assembly_chimeric_score_SE
                    BSPQI_status_DB <- as.character(
                    dat2$Found_in_self_BSPQI_molecules)
                    BSSSI_status_DB <- as.character(
                    dat2$Found_in_self_BSSSI_molecules)
                    BSPQI_chimeric_score_DB <- as.character(
                    dat2$Fail_BSPQI_assembly_chimeric_score)
                    BSSSI_chimeric_score_DB <- as.character(
                    dat2$Fail_BSSSI_assembly_chimeric_score)
                    if((length(grep("inversion", variantType2[nn])) >= 1)){
                        
                        if (((dat2$RefStartPos >= rf_wb_int_parents[nn]) 
                            & (dat2$RefEndPos <= re_fb_int_parents[nn])) 
                            & (perc_ref_query >= perc_similarity_parents 
                            & perc_query_ref >= perc_similarity_parents)
                            & identical(chrom2,chromo2[nn])
                            & identical(type, variantType2[nn]) 
                            & identical(svfamid1, svfamid)){
                        # Family Extra column zygosity
                            if (patID == 1 & patID1 == 2){
                                #countfre <- countfre + 0
                                motherZygosity <- as.character(zygo)
                                fatherZygosity <- "-"
                            } 
                            else if (patID == 1 & patID1 == 3){
                                #countfre <- countfre + 0
                                motherZygosity <- "-"
                                fatherZygosity <- as.character(zygo)
                            } 
                            else if (patID == patID1){
                                #countfre <- countfre + 0
                                motherZygosity <- "-"
                                fatherZygosity <- "-"
                            } 
                            else{
                          
                                motherZygosity <- "-"
                                fatherZygosity <- "-"
                            }
                        }  
                        else if (identical(chrom2,chromo2[nn]) &
                        identical(type,variantType2[nn]) 
                        & (perc_ref_query >= perc_similarity 
                        & perc_query_ref >= perc_similarity)
                        & !(identical(svfamid1, svfamid)) & 
                        ((BSPQI_status_DB == "yes" & 
                        BSSSI_status_DB == "yes") | 
                        (BSPQI_status_DB == "no" &
                        BSSSI_status_DB == "yes") | 
                        (BSPQI_status_DB == "yes" & 
                        BSSSI_status_DB == "no") | 
                        (BSPQI_status_DB == "yes" &
                        BSSSI_status_DB == "-") | 
                        (BSPQI_status_DB == "-" & 
                        BSSSI_status_DB == "yes")
                        |(Found_in_SE_self_molecules == "yes")) 
                        &(conf > invconf)  
                        & ((BSPQI_chimeric_score_DB == "pass" 
                        & BSSSI_chimeric_score_DB == "pass") | 
                        (BSPQI_chimeric_score_DB == "fail" & 
                        BSSSI_chimeric_score_DB == "pass") | 
                        (BSPQI_chimeric_score_DB == "pass" & 
                        BSSSI_chimeric_score_DB == "fail") |
                        (BSPQI_chimeric_score_DB == "pass" & 
                        BSSSI_chimeric_score_DB == "-") | 
                        (BSPQI_chimeric_score_DB == "-" & 
                        BSSSI_chimeric_score_DB == "pass")
                        |(Fail_assembly_chimeric_score_SE == "pass"))
                        & ((typ1=="inversion" & typ2=="inversion") |
                        (typ1=="inversion" & is.na(typ2)) | 
                        (is.na(typ1) & typ2=="inversion")
                        | (typ1=="-" & typ2=="-" & type == "inversion"))){
                            if(zygo=="homozygous"){
                                countfre <- 2
                            }
                            else if(zygo=="unknown"){
                                countfre <- 2
                            }
                            else{ 
                                countfre <- 1
                            }
                            if(as.character(zygo)=="homozygous"){
                                homozygo<- as.character(svfamid1)
                            }
                            else{
                                homozygo<-  NULL
                            }
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                        } 
                        else {
                            countfre <- 0
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                        }
                    
                    if (identical(chrom2,chromo2[nn]) & 
                        identical(type, variantType2[nn]) 
                        & (perc_ref_query >= perc_similarity 
                        & perc_query_ref >= perc_similarity)
                        & !(identical(svfamid1, svfamid)) ){
                      
                        if(zygo=="homozygous"){
                            countfreunfilt <- 2
                        }
                        else if(zygo=="unknown"){
                            countfreunfilt <- 2
                        }
                        else{ 
                            countfreunfilt <- 1
                        }
                        }
                        else{
                            countfreunfilt <-  0
                        }
                    }else{
                        if (((dat2$RefStartPos >= rf_wb_int_parents[nn]) & 
                            (dat2$RefEndPos <= re_fb_int_parents[nn])) & 
                            identical(chrom2,chromo2[nn])& 
                            identical(type, variantType2[nn]) & 
                            (identical(svfamid1, svfamid))){
                        # Family Extra column zygosity
                            if (patID == 1 & patID1 == 2){
                                countfre <- countfre + 0
                                motherZygosity <- as.character(zygo)
                                fatherZygosity <- "-"
                            } 
                            else if (patID == 1 & patID1 == 3){
                                countfre <- countfre + 0
                                motherZygosity <- "-"
                                fatherZygosity <- as.character(zygo)
                            } 
                            else if (patID == patID1){
                                countfre <- countfre + 0
                                motherZygosity <- "-"
                                fatherZygosity <- "-"
                            } 
                            else{
                          
                                motherZygosity <- "-"
                                fatherZygosity <- "-"
                            }
                        }  
                        else if (identical(chrom2,chromo2[nn]) &
                        identical(type,variantType2[nn]) &
                        !(identical(svfamid1, svfamid)) & 
                        ((BSPQI_status_DB == "yes" & 
                        BSSSI_status_DB == "yes") | 
                        (BSPQI_status_DB == "no" &
                        BSSSI_status_DB == "yes") | 
                        (BSPQI_status_DB == "yes" & 
                        BSSSI_status_DB == "no") | 
                        (BSPQI_status_DB == "yes" &
                        BSSSI_status_DB == "-") | 
                        (BSPQI_status_DB == "-" & 
                        BSSSI_status_DB == "yes")
                        |(Found_in_SE_self_molecules == "yes")) 
                        & (conf > transconf)
                        & ((BSPQI_chimeric_score_DB == "pass" 
                        & BSSSI_chimeric_score_DB == "pass") | 
                        (BSPQI_chimeric_score_DB == "fail" & 
                        BSSSI_chimeric_score_DB == "pass") | 
                        (BSPQI_chimeric_score_DB == "pass" & 
                        BSSSI_chimeric_score_DB == "fail") |
                        (BSPQI_chimeric_score_DB == "pass" & 
                        BSSSI_chimeric_score_DB == "-") | 
                        (BSPQI_chimeric_score_DB == "-" & 
                        BSSSI_chimeric_score_DB == "pass")
                        |(Fail_assembly_chimeric_score_SE == "pass"))
                        & ((typ1=="translocation" & typ2=="translocation") 
                        | (typ1=="translocation" & is.na(typ2)) 
                        | (is.na(typ1) & typ2=="translocation") 
                        | (typ1=="translocation_intrachr" 
                        & typ2=="translocation_intrachr") 
                        | (typ1=="translocation_intrachr" & is.na(typ2)) 
                        | (is.na(typ1) & typ2=="translocation_intrachr") 
                        | (typ1=="translocation_interchr" 
                        & typ2=="translocation_interchr") 
                        | (typ1=="translocation_interchr" & is.na(typ2)) 
                        | (is.na(typ1) & typ2=="translocation_interchr")
                        | (typ1=="-" & typ2=="-" & type == "translocation")
                        | (typ1=="-" & typ2=="-" 
                        & type == "translocation_interchr")
                        | (typ1=="-" & typ2=="-" 
                        & type == "translocation_intrachr"))){
                            if(zygo=="homozygous"){
                                countfre <- 2
                            }
                            else if(zygo=="unknown"){
                                countfre <- 2
                            }
                            else{ 
                                countfre <- 1
                            }
                            if(as.character(zygo)=="homozygous"){
                                homozygo<- as.character(svfamid1)
                            }
                            else{
                                homozygo<-  NULL
                            }
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                        } 
                        else {
                            countfre <- countfre + 0
                            motherZygosity <- "-"
                            fatherZygosity <- "-"
                        }
                    
                    if (identical(chrom2,chromo2[nn]) & 
                        identical(type, variantType2[nn]) &
                        !(identical(svfamid1, svfamid)) ){
                      
                        if(zygo=="homozygous"){
                            countfreunfilt <- 2
                        }
                        else if(zygo=="unknown"){
                            countfreunfilt <- 2
                        }
                        else{ 
                            countfreunfilt <- 1
                        }
                        }
                        else{
                            countfreunfilt <-  0
                        }
                    }
                     
                    ##Checking for whether there are any homozygous variants or 
                    ##not
                    if(length(homozygo)>0){
                        homozygo <- length(homozygo)
                    }
                    else{
                        homozygo= 0
                    }
                  ##### print(paste('INVTRANS:',countfre,sep=''))
                    famno <- as.numeric(
                        unname(hash::values(ha, keys = svfamid)))
                    data1 <- data.frame(dat1[nn, ], 
                    Internal_Freq_Perc_Filtered = 
                    as.numeric(format(round((
                    countfre/(2*(usamp - famno))) * 100,digits=3), scientific = FALSE)),
                    Internal_Freq_Perc_Unfiltered = as.numeric(format(round((
                    countfreunfilt/(2*(usamp - famno))) * 100,digits=3), scientific = FALSE)), 
                    Internal_Homozygotes=as.numeric(homozygo), 
                    MotherZygosity = as.character(motherZygosity), 
                    FatherZygosity = as.character(fatherZygosity),  
                    stringsAsFactors = FALSE)
                  
                  #### print(dim(data1))
                    datf <- rbind(datf, data1)
                } 
                else{
                 
                    data1 <- data.frame(dat1[nn, ], 
                    Internal_Freq_Perc_Filtered= 0, 
                    Internal_Freq_Perc_Unfiltered =0,
                    Internal_Homozygotes= 0, MotherZygosity = "-", 
                    FatherZygosity = "-",  stringsAsFactors = FALSE)
                  #### print(dim(data1))
                    datf <- rbind(datf, data1)
                   # next;
                }
                    
            }
            else{
                #### print(paste('QueryData:',dim(dat1[nn,]),sep=''))
                
                data1 <- data.frame(dat1[nn, ], 
                    Internal_Freq_Perc_Filtered= 0,
                    Internal_Freq_Perc_Unfiltered = 0, 
                    Internal_Homozygotes= 0, MotherZygosity = "-", 
                    FatherZygosity = "-", stringsAsFactors = FALSE)
                    #### print(dim(data1))
                    datf <- rbind(datf, data1)
            }
            
        }
        dataFinal <- rbind(dataFinal, datf)
    }
    if(returnMethod=="Text"){
        st1 <- strsplit(smap, ".txt")
        fname <- st1[[1]][1]
        row.names(dataFinal) <- c()
        filenam<-paste(fname,"_Int.txt",sep="")
        write.table(dataFinal, file.path(smappath, fname), sep = "\t", 
            row.names = FALSE)
    }
    else if (returnMethod=="dataFrame"){
        return(dataFinal)
    }
    else{
        stop("returnMethod Incorrect")
    }
}
VilainLab/Nanotator documentation built on Aug. 2, 2024, 8:45 p.m.