# R/504-readMolFromSmi.R

#' Read Molecules from SMILES Files and Return Parsed Java
#' Molecular Object or Plain Text List
#'
#' Read Molecules from SMILES Files and Return Parsed Java
#' Molecular Object or Plain Text List
#'
#' This function reads molecules from a SMILES file and returns either
#' the parsed Java molecular objects or the plain-text SMILES strings
#' needed by \code{extractDrug...()} functions.
#'
#' The file is read with \code{scan()}, so its content is split on
#' whitespace and every resulting token is treated as one SMILES string.
#'
#' @param smifile Character string, the location of the SMILES file.
#'        It is passed directly to \code{scan()}, which reads a single file.
#' @param type \code{'mol'} (the default) or \code{'text'}.
#'        \code{'mol'} returns the parsed Java molecular objects;
#'        \code{'text'} returns the SMILES strings as plain text.
#'        For common molecular descriptors and
#'        fingerprints, use \code{'mol'}.
#'        For descriptors and fingerprints calculated by OpenBabel,
#'        i.e. functions named \code{extractDrugOB...()}, use \code{'text'}.
#'        The value is resolved with \code{match.arg()}, so any other
#'        value raises an error.
#'
#' @return For \code{type = 'mol'}, the result of \code{parseSmiles()}
#' applied to the SMILES strings (parsed Java molecular objects).
#' For \code{type = 'text'}, a character vector of SMILES strings.
#'
#' @seealso See \code{\link{readMolFromSDF}} for reading molecules
#' from SDF files and returning parsed Java molecular object.
#'
#' @export readMolFromSmi
#'
#' @examples
#' smi = system.file('vignettedata/FDAMDD.smi', package = 'Rcpi')
#' \donttest{
#' mol1 = readMolFromSmi(smi, type = 'mol')
#' mol2 = readMolFromSmi(smi, type = 'text')}

readMolFromSmi = function (smifile, type = c('mol', 'text')) {

    # Resolve the length-2 default c('mol', 'text') to a single choice
    # ('mol'). Using the unresolved default directly as an `if` condition
    # is an error in R >= 4.2. match.arg() also rejects unsupported values.
    type = match.arg(type)

    # what = character() makes scan() return the whitespace-separated
    # tokens of the file as a character vector.
    smi = scan(smifile, what = character(), quiet = TRUE)

    # Plain-text mode: hand the SMILES strings back untouched.
    if (type == 'text') {
        return(smi)
    }

    # 'mol' mode: delegate parsing to parseSmiles().
    parseSmiles(smi)

}
# nanxstats/Rcpi documentation built on Sept. 24, 2024, 9:36 a.m.