SCM

SCM Repository

[inlinedocs] Diff of /pkg/inlinedocs/R/parsers.R
ViewVC logotype

Diff of /pkg/inlinedocs/R/parsers.R

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 142, Wed Oct 20 09:21:53 2010 UTC revision 159, Tue Nov 9 16:42:39 2010 UTC
# Line 28  Line 28 
28  ### String without prefixes or newlines.  ### String without prefixes or newlines.
29  }  }
30    
31  ### For each object in the package that satisfies the criterion#  ### For each object in the package that satisfies the criterion
32  ## checked by subfun, parse source using FUN and return the resulting  ### checked by subfun, parse source using FUN and return the resulting
33  ### documentation list.  ### documentation list.
34  forall <- function  forall <- function
35  (FUN,  (FUN,
# Line 136  Line 136 
136    starts <- c(1,bounds+1)    starts <- c(1,bounds+1)
137    ends <- c(bounds,length(clines))    ends <- c(bounds,length(clines))
138    ## detect body of function using paren matching    ## detect body of function using paren matching
139    f <- function(ch)cumsum(nchar(gsub(sprintf("[^%s]",ch),"",src)))    code <- gsub("#.*","",src)
140      f <- function(ch)cumsum(nchar(gsub(sprintf("[^%s]",ch),"",code)))
141    parens <- f("(")-f(")")    parens <- f("(")-f(")")
142    body.begin <- which(diff(parens)<0 & parens[-1]==0)+2    body.begin <- which(diff(parens)<0 & parens[-1]==0)+2
143    is.arg <- function(){    is.arg <- function(){
144      0 == length(grep("^\\s*#",src[start-1],perl=TRUE)) &&      gres <- grep("^\\s*#",src[start-1],perl=TRUE)
145        start<=body.begin      0 == length(gres) && start<=body.begin
146      }      }
147    res <- list()    res <- list()
148    for(i in seq_along(starts)){    for(i in seq_along(starts)){
# Line 165  Line 166 
166    res    res
167  }  }
168    
169  ### Parsers for each object/function that are constructed  extract.xxx.chunks <- function # Extract documentation from a function
 ### automatically. This is a named list, each element is a list of 2  
 ### elements: forfun/forall, then a parser function for an individual  
 ### object.  
 forfun.parsers <-  
   list(prefixed.lines=prefixed.lines,  
        examples.after.return=examples.after.return,  
        ## Extract lots of info from normal functions.  
        parsefun=function(src,name,...){  
          extract.docs.fun(src,name)  
        },  
        ## title from first line of function def  
        title.from.firstline=function(src,name,code,...){  
          if(length(grep("#",src[1]))){  
            list(title=gsub("[^#]*#\\s*(.*)","\\1",src[1],perl=TRUE))  
          } else list()  
        },  
        ## PhG: it is tests/FUN.R!!! I would like more flexibility here  
        ## please, let me choose which dir to use for examples!  
        ## Get examples for FUN from the file tests/FUN.R  
        examples.from.testfile=function(name,...){  
          tsubdir <- getOption("inlinedocs.exdir")  
          if (is.null(tsubdir)) tsubdir <- "tests"       # Default value  
          tfile <- file.path("..",tsubdir,paste(name,".R",sep=""))  
          if(file.exists(tfile))  
            list(examples=paste(readLines(tfile),collapse="\n"))  
          else list()  
        },  
        definition.from.source=function(doc,src,...){  
          def <- doc$definition  
          if(is.null(def)||def=="")  
            list(definition=paste(src,collapse="\n"))  
          else list()  
        })  
   
 ### List of Parser Functions that can be applied to any object.  
 forall.parsers <-  
   list(## Fill in author from DESCRIPTION and titles.  
        author.from.description=function(desc,...){  
          list(author=desc[,"Maintainer"])  
        },  
        ## The format section sometimes causes problems, so erase it.  
        erase.format=function(...){  
          list(format="")  
        },  
        ## Convert the function name to a title.  
        title.from.name=function(name,doc,...){  
          if("title"%in%names(doc))list() else  
          list(title=gsub("[._]"," ",name))  
        },  
        ## PhG: here is what I propose for examples code in the 'ex' attribute  
        examples.in.attr =  function (name, o, ...) {  
          ex <- attr(o, "ex")  
          if (!is.null(ex)) {  
            ## Special case for code contained in a function  
            if (inherits(ex, "function")) {  
              ## If source is available, start from there  
              src <- attr(ex, "source")  
              if (!is.null(src)) {  
                ex <- src  
              } else { ## Use the body of the function  
                ex <- deparse(body(ex))  
              }  
              ## Eliminate leading and trailing code  
              ex <- ex[-c(1, length(ex))]  
              ## Eliminate leading tabulations or 2/4 spaces  
              ex <- sub("^\t|    |  ", "", ex)  
              ## Add an empty line before and after example  
              ex <- c("", ex, "")  
            }  
            list(examples = paste(ex, collapse = "\n"))  
          } else list()  
        })  
   
 ### List of parser functions that operate on single objects. This list  
 ### is useful for testing these functions.  
 lonely <- c(forall.parsers,forfun.parsers)
 ## The "ex" attribute holds a function. examples.in.attr (in
 ## forall.parsers) reads attr(o, "ex") and turns the text of such a
 ## function into example code, so the body below is kept exactly as is.
 attr(lonely,"ex") <- function(){
   lonely$parsefun(attr(extract.docs.file,"source"),"extract.docs.file")
 }
   
 extra.code.docs <- function # Extract documentation from code chunks  
 ### Parse R code to extract inline documentation from comments around  
 ### each function. These are not able to be retreived simply by  
 ### looking at the "source" attribute. This is a Parser Function that  
 ### can be used in the parser list of package.skeleton.dx(). TODO:  
 ### Modularize this into separate Parsers Functions for S4 classes,  
 ### prefixes, ##<<blocks, etc. Right now it is not very clean!  
 (code,  
 ### Code lines in a character vector containing multiple R objects to  
 ### parse for documentation.  
  objs,  
 ### The objects defined in the code.  
  ...  
 ### ignored  
  ){  
   parsed <- extract.file.parse(code)  
   extract.docs.try <- function(o,on)  
     {  
       ## Note: we could use parsed information here too, but that  
       ## would produce different results for setMethodS3 etc.  
       doc <- list()  
       if ( !is.null(parsed[[on]]) ){  
         if ( !is.na(parsed[[on]]@code[1]) ){ # no code given for generics  
           doc$definition <- paste(parsed[[on]]@code,collapse="\n")  
         }  
         if(!"description"%in%names(doc) && !is.na(parsed[[on]]@description) ){  
           doc$description <- parsed[[on]]@description  
         }  
         if ( "setMethodS3" == parsed[[on]]@created ){  
           # PhG: this may be wrong! It does not catch correctly how the method  
           # must be splitted in case of methods containing dots. for instance,  
           # as.data.frame.matrix must be split into: m1 = as.data.frame and  
           # m2 = matrix... here you got m1 = as, and m2 = data.frame.matrix!!!  
                   pattern <- "^([^\\.]+)\\.(.*)$"  
           doc$s3method=c(m1 <- gsub(pattern,"\\1",on,perl=TRUE),  
               m2 <- gsub(pattern,"\\2",on,perl=TRUE))  
           if ( 0 < length(grep("\\W",m1,perl=TRUE)) ){  
                           m1 <- paste("`",m1,"`",sep="")  
           }  
           cat("S3method(",m1,",",m2,")\n",sep="")  
         }  
       }  
       if("title" %in% names(doc) && !"description" %in% names(doc) ){  
         ## For short functions having both would duplicate, but a  
         ## description is required. Therefore automatically copy title  
         ## across to avoid errors at package build time.  
         doc$description <- doc$title  
       }  
       doc  
     }  
   extract.docs <- function(on){  
     res <- try({o <- objs[[on]]  
                 extract.docs.try(o, on)},FALSE)  
     if(class(res)=="try-error"){  
       cat("Failed to extract docs for: ",on,"\n\n")  
       list()  
     } else if(0 == length(res) && inherits(objs[[on]],"standardGeneric")){  
       NULL  
     } else if(0 == length(res) && "function" %in% class(o)  
               && 1 == length(osource <- attr(o,"source"))  
               && 1 == length(grep(paste("UseMethod(",on,")",sep="\""),osource))  
               ){  
       ## phew - this should only pick up R.oo S3 generic definitions like:  
       ## attr(*, "source")= chr "function(...) UseMethod(\"select\")"  
       NULL  
     } else res  
   }  
   doc.names <- names(objs)  
   res <- sapply(doc.names,extract.docs,simplify=FALSE)  
   ## Special processing for S4 classes as they do not appear in normal ls()  
   for ( nn in names(parsed) ){  
     if ( parsed[[nn]]@created == "setClass" ){  
       S4class.docs <- extract.docs.setClass(parsed[[nn]])  
       docname <- paste(nn,"class",sep="-")  
       if ( is.null(res[[docname]]) ){  
         res[[docname]] <- S4class.docs  
         doc.names <- c(doc.names,docname)  
       } else {  
         stop(nn," appears as both S4 class and some other definition")  
       }  
     }  
   }  
   inherit.docs <- function(on){  
     in.res <- res[[on]]  
     if ( !is.null(parsed[[on]]) ){  
       for ( parent in parsed[[on]]@parent ){  
         if ( !is.na(parent) ){  
           if ( is.null(in.res) ){  
             in.res <- res[[parent]]  
           } else if ( parent %in% names(res) ){  
             parent.docs <- res[[parent]]  
             for ( nn in names(parent.docs) ){  
               if ( !nn %in% names(in.res) ){  
                 in.res[[nn]] <- parent.docs[[nn]]  
               }  
             }  
           }  
         }  
       }  
     }  
     invisible(in.res)  
   }  
   all.done <- FALSE  
   while ( !all.done ){  
     res1 <- sapply(doc.names,inherit.docs,simplify=FALSE)  
     all.done <- identical(res1,res)  
     res <- res1  
   }  
   ## now strip out any generics (which have value NULL in res):  
   res.not.null <- sapply(res,function(x){!is.null(x)})  
   if ( 0 < length(res.not.null) && length(res.not.null) < length(res) ){  
     res <- res[res.not.null]  
   }  
   res  
 ### named list of lists, one for each object to document.  
 }  
   
 ### List of parsers to use by default with package.skeleton.dx.  
 default.parsers <-  
   c(extra.code.docs=extra.code.docs, ## TODO: cleanup!  
     sapply(forfun.parsers,forfun),  
     sapply(forall.parsers,forall),  
     edit.package.file=function(desc,...){  
       in.details <- setdiff(colnames(desc),"Description")  
       details <- paste(paste(in.details,": \\tab ",desc[,in.details],"\\cr",  
                              sep=""),collapse="\n")  
       L <-  
         list(list(title=desc[,"Title"],  
                   description=desc[,"Description"],  
                   `tabular{ll}`=details,  
                   author=desc[,"Maintainer"]))  
       names(L) <- paste(desc[,"Package"],"-package",sep="")  
       L  
     })  
   
 extract.docs.fun <- function # Extract documentation from a function  
170  ### Given source code of a function, return a list describing inline  ### Given source code of a function, return a list describing inline
171  ### documentation in that source code.  ### documentation in that source code.
172  (code,  (src,
173  ### The function to examine.  ### The source lines of the function to examine, as a character
174   name.fun  ### vector.
175     name.fun="(unnamed function)",
176  ### The name of the function/chunk to use in warning messages.  ### The name of the function/chunk to use in warning messages.
177     ...
178    ### ignored.
179   ){   ){
180    res <- list()    res <- list()
181    ##details<< For simple functions/arguments, the argument may also be    ##details<< For simple functions/arguments, the argument may also be
# Line 468  Line 256 
256            else paste(res[[field]], payload, sep=chunk.sep)            else paste(res[[field]], payload, sep=chunk.sep)
257        invisible(chunk.res)        invisible(chunk.res)
258      }      }
259    while ( k <= length(code) ){    while ( k <= length(src) ){
260      line <- code[k]      line <- src[k]
261      if ( 0 < length(grep(extra.regexp,line,perl=TRUE) ) ){      if ( 0 < length(grep(extra.regexp,line,perl=TRUE) ) ){
262        ## we have a new extra chunk - first get field name and any payload        ## we have a new extra chunk - first get field name and any payload
263        new.field <- gsub(extra.regexp,"\\1",line,perl=TRUE)        new.field <- gsub(extra.regexp,"\\1",line,perl=TRUE)
# Line 622  Line 410 
410  ### with the string in this list (implemented in modify.Rd.file).  ### with the string in this list (implemented in modify.Rd.file).
411  }  }
412    
413    ### Parsers for each function that are constructed automatically. This
414    ### is a named list, and each element is a parser function for an
415    ### individual object.
416    forfun.parsers <-
417      list(prefixed.lines=prefixed.lines,
418           examples.after.return=examples.after.return,
419           extract.xxx.chunks=extract.xxx.chunks,
420           ## title from first line of function def
421           title.from.firstline=function(src,name,code,...){
422             if(length(grep("#",src[1]))){
423               list(title=gsub("[^#]*#\\s*(.*)","\\1",src[1],perl=TRUE))
424             } else list()
425           },
426           ## PhG: it is tests/FUN.R!!! I would like more flexibility here
427           ## please, let me choose which dir to use for examples!
428           ## Get examples for FUN from the file tests/FUN.R
429           examples.from.testfile=function(name,...){
430             tsubdir <- getOption("inlinedocs.exdir")
431             if (is.null(tsubdir)) tsubdir <- "tests"       # Default value
432             tfile <- file.path("..",tsubdir,paste(name,".R",sep=""))
433             if(file.exists(tfile))
434               list(examples=paste(readLines(tfile),collapse="\n"))
435             else list()
436           },
437           definition.from.source=function(doc,src,...){
438             def <- doc$definition
439             is.empty <- function(x)is.null(x)||x==""
440             if(is.empty(def) && !is.empty(src))
441               list(definition=paste(src,collapse="\n"))
442             else list()
443           })
444    
445    ### List of Parser Functions that can be applied to any object.
446    forall.parsers <-
447      list(## Fill in author from DESCRIPTION and titles.
448           author.from.description=function(desc,...){
449             list(author=desc[,"Maintainer"])
450           },
451           ## The format section sometimes causes problems, so erase it.
452           erase.format=function(...){
453             list(format="")
454           },
455           ## Convert the function name to a title.
456           title.from.name=function(name,doc,...){
457             if("title"%in%names(doc))list() else
458             list(title=gsub("[._]"," ",name))
459           },
460           ## PhG: here is what I propose for examples code in the 'ex' attribute
461           examples.in.attr =  function (name, o, ...) {
462             ex <- attr(o, "ex")
463             if (!is.null(ex)) {
464               ## Special case for code contained in a function
465               if (inherits(ex, "function")) {
466                 ## If source is available, start from there
467                 src <- attr(ex, "source")
468                 if (!is.null(src)) {
469                   ex <- src
470                 } else { ## Use the body of the function
471                   ex <- deparse(body(ex))
472                 }
473                 ## Eliminate leading and trailing code
474                 ex <- ex[-c(1, length(ex))]
475                 ## Eliminate leading tabulations or 2/4 spaces
476                 ex <- sub("^\t|    |  ", "", ex)
477                 ## Add an empty line before and after example
478                 ex <- c("", ex, "")
479               }
480               list(examples = paste(ex, collapse = "\n"))
481             } else list()
482           })
483    
484    ### List of parser functions that operate on single objects. This list
485    ### is useful for testing these functions.
486    lonely <- c(forall.parsers,forfun.parsers)
487    attr(lonely,"ex") <- function(){
488      f <- function # title
489    ### description
490      (x, ##<< arg x
491       y
492    ### arg y
493       ){
494        ##value<< a list with elements
495        list(x=x, ##<< original x value
496             y=y, ##<< original y value
497             sum=x+y) ##<< their sum
498        ##end<<
499      }
500      src <- attr(f,"source")
501      lonely$extract.xxx.chunks(src)
502      lonely$prefixed.lines(src)
503    }
504    
505    extra.code.docs <- function # Extract documentation from code chunks
506    ### Parse R code to extract inline documentation from comments around
507    ### each function. These are not able to be retreived simply by
508    ### looking at the "source" attribute. This is a Parser Function that
509    ### can be used in the parser list of package.skeleton.dx(). TODO:
510    ### Modularize this into separate Parsers Functions for S4 classes,
511    ### prefixes, ##<<blocks, etc. Right now it is not very clean!
512    (code,
513    ### Code lines in a character vector containing multiple R objects to
514    ### parse for documentation.
515     objs,
516    ### The objects defined in the code.
517     ...
518    ### ignored
519     ){
520      parsed <- extract.file.parse(code)
521      extract.docs.try <- function(o,on)
522        {
523          ## Note: we could use parsed information here too, but that
524          ## would produce different results for setMethodS3 etc.
525          doc <- list()
526          if ( !is.null(parsed[[on]]) ){
527            if ( !is.na(parsed[[on]]@code[1]) ){ # no code given for generics
528              doc$definition <- paste(parsed[[on]]@code,collapse="\n")
529            }
530            if(!"description"%in%names(doc) && !is.na(parsed[[on]]@description) ){
531              doc$description <- parsed[[on]]@description
532            }
533            if ( "setMethodS3" == parsed[[on]]@created ){
534              # PhG: this may be wrong! It does not catch correctly how the method
535              # must be split in case of methods containing dots. For instance,
536              # as.data.frame.matrix must be split into: m1 = as.data.frame and
537              # m2 = matrix... here you got m1 = as, and m2 = data.frame.matrix!!!
538                      pattern <- "^([^\\.]+)\\.(.*)$"
539              doc$s3method=c(m1 <- gsub(pattern,"\\1",on,perl=TRUE),
540                  m2 <- gsub(pattern,"\\2",on,perl=TRUE))
541              if ( 0 < length(grep("\\W",m1,perl=TRUE)) ){
542                              m1 <- paste("`",m1,"`",sep="")
543              }
544              cat("S3method(",m1,",",m2,")\n",sep="")
545            }
546          }
547          if("title" %in% names(doc) && !"description" %in% names(doc) ){
548            ## For short functions having both would duplicate, but a
549            ## description is required. Therefore automatically copy title
550            ## across to avoid errors at package build time.
551            doc$description <- doc$title
552          }
553          doc
554        }
555      extract.docs <- function(on){
556        res <- try({o <- objs[[on]]
557                    extract.docs.try(o, on)},FALSE)
558        if(class(res)=="try-error"){
559          cat("Failed to extract docs for: ",on,"\n\n")
560          list()
561        } else if(0 == length(res) && inherits(objs[[on]],"standardGeneric")){
562          NULL
563        } else if(0 == length(res) && "function" %in% class(o)
564                  && 1 == length(osource <- attr(o,"source"))
565                  && 1 == length(grep(paste("UseMethod(",on,")",sep="\""),osource))
566                  ){
567          ## phew - this should only pick up R.oo S3 generic definitions like:
568          ## attr(*, "source")= chr "function(...) UseMethod(\"select\")"
569          NULL
570        } else res
571      }
572      doc.names <- names(objs)
573      res <- sapply(doc.names,extract.docs,simplify=FALSE)
574      ## Special processing for S4 classes as they do not appear in normal ls()
575      for ( nn in names(parsed) ){
576        if ( parsed[[nn]]@created == "setClass" ){
577          S4class.docs <- extract.docs.setClass(parsed[[nn]])
578          docname <- paste(nn,"class",sep="-")
579          if ( is.null(res[[docname]]) ){
580            res[[docname]] <- S4class.docs
581            doc.names <- c(doc.names,docname)
582          } else {
583            stop(nn," appears as both S4 class and some other definition")
584          }
585        }
586      }
587      inherit.docs <- function(on){
588        in.res <- res[[on]]
589        if ( !is.null(parsed[[on]]) ){
590          for ( parent in parsed[[on]]@parent ){
591            if ( !is.na(parent) ){
592              if ( is.null(in.res) ){
593                in.res <- res[[parent]]
594              } else if ( parent %in% names(res) ){
595                parent.docs <- res[[parent]]
596                for ( nn in names(parent.docs) ){
597                  if ( !nn %in% names(in.res) ){
598                    in.res[[nn]] <- parent.docs[[nn]]
599                  }
600                }
601              }
602            }
603          }
604        }
605        invisible(in.res)
606      }
607      all.done <- FALSE
608      while ( !all.done ){
609        res1 <- sapply(doc.names,inherit.docs,simplify=FALSE)
610        all.done <- identical(res1,res)
611        res <- res1
612      }
613      ## now strip out any generics (which have value NULL in res):
614      res.not.null <- sapply(res,function(x){!is.null(x)})
615      if ( 0 < length(res.not.null) && length(res.not.null) < length(res) ){
616        res <- res[res.not.null]
617      }
618      res
619    ### named list of lists, one for each object to document.
620    }
621    
622    ### List of parsers to use by default with package.skeleton.dx.
623    default.parsers <-
624      c(extra.code.docs=extra.code.docs, ## TODO: cleanup!
625        sapply(forfun.parsers,forfun),
626        sapply(forall.parsers,forall),
627        edit.package.file=function(desc,...){
628          in.details <- setdiff(colnames(desc),"Description")
629          details <- paste(paste(in.details,": \\tab ",desc[,in.details],"\\cr",
630                                 sep=""),collapse="\n")
631          L <-
632            list(list(title=desc[,"Title"],
633                      description=desc[,"Description"],
634                      `tabular{ll}`=details,
635                      author=desc[,"Maintainer"]))
636          names(L) <- paste(desc[,"Package"],"-package",sep="")
637          L
638        })
639    
640  setClass("DocLink", # Link documentation among related functions  setClass("DocLink", # Link documentation among related functions
641  ### The \code{.DocLink} class provides the basis for hooking together  ### The \code{.DocLink} class provides the basis for hooking together
642  ### documentation of related classes/functions/objects. The aim is that  ### documentation of related classes/functions/objects. The aim is that
# Line 760  Line 775 
775    ## the same line or \code{### } comments at the beginning of the    ## the same line or \code{### } comments at the beginning of the
776    ## following line.    ## following line.
777    f.n <- paste(class.name,"class",sep="-")    f.n <- paste(class.name,"class",sep="-")
778    docs <- extract.docs.fun(chunk.source,f.n)    docs <- extract.xxx.chunks(chunk.source,f.n)
779    ## also apply source parsing functions that I separated out into    ## also apply source parsing functions that I separated out into
780    ## separate functions    ## separate functions
781    docs <- combine(docs,lonely$prefixed.lines(chunk.source))    docs <- combine(docs,lonely$prefixed.lines(chunk.source))
# Line 805  Line 820 
820    old <- options(keep.source=TRUE)    old <- options(keep.source=TRUE)
821    on.exit(options(old))    on.exit(options(old))
822    exprs <- parse(text=code)    exprs <- parse(text=code)
823    for (i in exprs) eval(i, e)    for (i in exprs){
824        tryCatch(eval(i, e),error=function(e){
825          ##print(e)
826        })
827      }
828    objs <- sapply(ls(e),get,e,simplify=FALSE)    objs <- sapply(ls(e),get,e,simplify=FALSE)
829    
830    docs <- list()    docs <- list()

Legend:
Removed from v.142  
changed lines
  Added in v.159

root@r-forge.r-project.org
ViewVC Help
Powered by ViewVC 1.0.0  
Thanks to:
Vienna University of Economics and Business University of Wisconsin - Madison Powered By FusionForge