diff options
author | Carsten Dominik <carsten.dominik@gmail.com> | 2009-02-18 16:31:14 +0100 |
---|---|---|
committer | Carsten Dominik <carsten.dominik@gmail.com> | 2009-02-18 17:23:47 +0100 |
commit | c0cc9181db53c8c76a8a9cbd14b04266e48bdbbe (patch) | |
tree | 477c9fde674b566959f8c355b8726285edeb9c7c | |
parent | a55dd5a9e62f99ce893c3570ff9f5b45108097d7 (diff) | |
download | org-mode-c0cc9181db53c8c76a8a9cbd14b04266e48bdbbe.tar.gz |
Added org-R.el to contrib/lisp/
-rw-r--r-- | contrib/ChangeLog | 4 | ||||
-rw-r--r-- | contrib/README | 1 | ||||
-rw-r--r-- | contrib/lisp/org-R.el | 852 | ||||
-rwxr-xr-x | lisp/ChangeLog | 2 | ||||
-rw-r--r-- | lisp/org.el | 1 |
5 files changed, 859 insertions, 1 deletions
diff --git a/contrib/ChangeLog b/contrib/ChangeLog index e04c08c..b5ddbeb 100644 --- a/contrib/ChangeLog +++ b/contrib/ChangeLog @@ -1,3 +1,7 @@ +2009-02-18 Carsten Dominik <carsten.dominik@gmail.com> + + * lisp/org-R.el: New file. + 2009-02-13 Carsten Dominik <carsten.dominik@gmail.com> * lisp/org-choose.el (org-choose-get-fn-map-group): Require diff --git a/contrib/README b/contrib/README index 2715a1e..5236daa 100644 --- a/contrib/README +++ b/contrib/README @@ -27,6 +27,7 @@ org-mairix.el --- Hook mairix search into Org for different MUAs org-man.el --- Support for links to manpages in Org-mode org-mtags.el --- Support for some Muse-like tags in Org-mode org-panel.el --- Simple routines for us with bad memory +org-R.el --- Computation using the R language org-registry.el --- A registry for Org links org2rem.el --- Convert org appointments into reminders org-screen.el --- Visit screen sessions through Org-mode links diff --git a/contrib/lisp/org-R.el b/contrib/lisp/org-R.el new file mode 100644 index 0000000..c89a4a9 --- /dev/null +++ b/contrib/lisp/org-R.el @@ -0,0 +1,852 @@ +;;; org-R.el --- Numerical computation and data visualisation for org-mode using R + +;; Copyright (C) 2009 +;; Free Software Foundation, Inc. + +;; Author: Dan Davison <davison@stats.ox.ac.uk> +;; Keywords: org, R, ESS, tables, graphics +;; Homepage: http://www.stats.ox.ac.uk/~davison/software/org-R +;; Version: 0.05 2009-02-05 +;; +;; This file is not part of GNU Emacs. +;; +;; This file is free software; you can redistribute it and/or modify +;; it under the terms of the GNU General Public License as published by +;; the Free Software Foundation; either version 3, or (at your option) +;; any later version. + +;; This file is distributed in the hope that it will be useful, +;; but WITHOUT ANY WARRANTY; without even the implied warranty of +;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +;; GNU General Public License for more details. + +;; You should have received a copy of the GNU General Public License +;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; +;; +;;; Commentary: + +;; This file allows R (http://www.r-project.org) code to be applied to +;; emacs org-mode (http://orgmode.org) tables. When the +;; result of the analysis is a vector or matrix, it is output back +;; into the org-mode buffer as a new org table. Alternatively the R +;; code may be used to plot the data in the org table. It requires R to be +;; running in an inferior-ess-mode buffer (install Emacs Speaks +;; Statistics http://ess.r-project.org and issue M-x R). +;; +;; +;; The user interface is via two different options lines in the org +;; buffer. As is conventional in org-mode, these are lines starting +;; with `#+'. Lines starting with #+R: specify options in the +;; standard org style (option:value) and are used to specify certain +;; off-the-shelf transformations and plots of the table data. The +;; #+R: line is also used to specify the data to be analysed +;; (either an org table or a csv file), and to restrict the analysis +;; to certain columns etc. In lines starting #+RR: you can supply +;; literal R code, giving you full control over what you do with the +;; table. With point in the first #+R line, M-x org-R-apply +;; makes happen whatever has been specified in those lines. + +;; The best documentation is currently the Worg tutorial: +;; +;; http://orgmode.org/worg/org-tutorials/org-R/org-R.php + + +(defconst org-R-skeleton-funcall-1-arg + "%s(x[%s]%s)" + "Skeleton of a call to an R function. +E.g. barplot(x[,3:5], names.arg=rownames(x))") + +(defconst org-R-skeleton-funcall-2-args + "%s(x[,%s], x[,%s]%s)" + "Skeleton of a call to an R function which can take x and y + args.") + +(defconst org-R-write-org-table-def + "write.org.table <- function (x, write.rownames = TRUE) +{ + if(!is.null(dim(x)) && length(dim(x)) > 2) + stop(\"Object must be 1- or 2-dimensional\") ; + if(is.vector(x) || is.table(x) || is.factor(x) || is.array(x)) + x <- as.matrix(x) ; + if(!(is.matrix(x) || inherits(x, c('matrix', 'data.frame')))) { + invisible() ; + print(x) ; + stop(\"Object not recognised as 1- or 2-dimensional\") ; + } ; + if(is.null(colnames(x))) + colnames(x) <- rep('', ncol(x)) ; + if(write.rownames) + x <- cbind(rownames(x), x) ; + cat('|', paste(colnames(x), collapse = ' | '), '|\\n') ; + cat('|', paste(rep('----', ncol(x)), collapse = '+'), '|\\n', sep = '') ; + invisible(apply(x, 1, function(row) cat('|', paste(row, collapse = ' | '), '|\\n'))) ; +}" + "Definition of R function to write org table representation of R objects. +To see a more human-readable version of this, look at the code, +or type dput(write.org.table) RET at the R (inferior-ess-mode +buffer) prompt.") + + +(defun org-R-apply () + "Construct and evaluate an R function call. +Construct an R function corresponding to the #+R: and #+RR: +lines. R must be currently running in an inferior-ess-mode +buffer. The function evaluates any user-supplied R code in the +#+RR: line before the off-the-shelf actions specified in the #+R: +line. The user-supplied R code can operate on a variable called x +that is the org table represented as a data frame in R. Text +output from the R process may be inserted into the org buffer, as +an org table where appropriate." + (interactive) + (require 'ess) + (save-excursion + (beginning-of-line) + (unless (looking-at "#\\+RR?:") (error "Point must be in a #+R or #+RR line")) + (while (looking-at "#\\+RR?:") (forward-line -1)) + (forward-line) + ;; For the rest of the code in this file we are based at the + ;; beginning of the first #+R line + + ;; FIXME: if point is at the beginning of the #+RR? lines when + ;; this function is called, then tabular output gets inserted, + ;; leaving point up at the top of the tabular output. + + (let* ((options (org-R-get-options)) + (code (org-R-construct-code options)) + (infile (plist-get options :infile)) + (ext (if infile (file-name-extension infile))) + csv-file) + + (if (string-equal ext "csv") + (setq csv-file infile) + (setq csv-file + (org-R-export-to-csv + (make-temp-file "org-R-tmp" nil ".csv") options))) + + (org-R-eval code csv-file options) + + (delete-other-windows) ;; FIXME + (if (plist-get options :showcode) (org-R-showcode code))))) + +(defun org-R-apply-throughout-subtree () + "Call org-R-apply in every org-R block in current subtree." + ;; This currently relies on re-search-forward leaving point after + ;; the #+RR?: If point were at the beginning of the line, then + ;; tabular input would get inserted leaving point above the #+RR?:, + ;; and this would loop infinitely. Same for org-R-apply-to-buffer. + (interactive) + (save-excursion + (org-back-to-heading) + (while (re-search-forward + "^#\\+RR?:" + (save-excursion (org-end-of-subtree)) t) + (org-R-apply) + (forward-line) + (while (looking-at "#\\+RR?") + (forward-line))))) + +(defun org-R-apply-throughout-buffer () + "Call org-R-apply in every org-R block in the buffer." + (interactive) + (save-excursion + (goto-char (point-min)) + (while (re-search-forward "^#\\+RR?:" nil t) + (org-R-apply) + (forward-line) + (while (looking-at "#\\+RR?") + (forward-line))))) + +(defun org-R-construct-code (options) + "Construct the R function that implements the requested +behaviour. +The body of this function derives from two sources: + +1. Explicit R code which is read from lines starting with +#+RR: by org-R-get-user-code, and + +2. Off-the-shelf code corresponding to options specified in the +#+R: line. This code is constructed by +org-R-off-the-shelf-code." + (let ((user-code (org-R-get-user-code)) + (action (plist-get options :action))) + + (if (or (eq action 'tabulate) (eq action 'transpose)) + (setq options (plist-put options :output-to-buffer t))) + (format "function(x){%sx}" + (concat + (when user-code (concat user-code ";")) + (when action (concat (org-R-off-the-shelf-code options) ";")))))) + +(defun org-R-get-user-code (&optional R) + "Read user-supplied R code from #+RR: lines." + (let ((case-fold-search t)) + (save-excursion + (while (looking-at "^#\\+\\(RR?:\\) *\\(.*\\)") + (if (string= "RR:" (match-string 1)) + (setq R (concat R (when R ";") (match-string 2)))) + (forward-line)))) + R) + +(defun org-R-off-the-shelf-code (options) + "Return R code implementing the actions requested in the +#+R: lines." + + ;; This is a somewhat long function as it deals with several + ;; different cases, corresponding to all the off-the-shelf actions + ;; that have been implemented. + + (let* ((action (plist-get options :action)) + (cols (plist-get options :columns)) + (ncols (org-R-number-of-columns cols)) + (nxcols (nth 0 ncols)) + (nycols (nth 1 ncols)) + (cols-R (org-R-make-index-vectors cols)) + (xcols-R (nth 0 cols-R)) + (ycols-R (nth 1 cols-R)) + seq args largs extra-code title colour matrix-index) + + ;; I want this to affect options outside this function. Will it + ;; necessarily do so? (not if plist-put adds to head of the + ;; plist?) + (setq options (plist-put options :nxcols nxcols)) + + (cond ((eq action 'points) + (setq action 'plot) + (setq options (plist-put options :lines nil))) + ((eq action 'lines) + (setq action 'plot) + (setq options (plist-put options :lines t)))) + + (if (and (setq title (plist-get options :title)) (symbolp title)) + (setq title symbol-name title)) + + (setq args (plist-put args :main (concat "\"" title "\""))) + + (if (setq colour (or (plist-get options :colour) + (plist-get options :color) + (plist-get options :col))) + (setq args + (plist-put args :col + (concat "\"" (if (symbolp colour) (symbol-name colour) colour) "\"")))) + + (setq largs + (if (setq legend (plist-get options :legend)) + (plist-put largs :x + (concat "\"" (if (symbolp legend) (symbol-name legend) legend) "\"")) + (plist-put largs :x "\"topright\""))) + + (cond + ((null ycols-R) + ;; single set of columns; implicit x values + (if (null xcols-R) + (setq xcols-R "" matrix-index "") + (setq matrix-index (concat "," xcols-R))) + (cond + + ;;---------------------------------------------------------------------- + + ((eq action 'barplot) + (if (eq nxcols 1) + (progn + (setq args (plist-put args :names.arg "rownames(x)")) + (setq args (org-R-set-user-supplied-args args (plist-get options :args))) + (format org-R-skeleton-funcall-1-arg + "barplot" xcols-R + (concat ", " (org-R-plist-to-R-args args)))) + + (setq args (plist-put args :names.arg "colnames(x)")) + (setq args (plist-put args :col "seq(nrow(x))")) + (setq args (plist-put args :beside "TRUE")) + + (setq largs (plist-put largs :bty "\"n\"")) + ;; (setq largs (plist-put largs :lwd 10)) + (setq largs (plist-put largs :col "seq(nrow(x))")) + (setq largs (plist-put largs :legend "rownames(x)")) + + (setq args (org-R-set-user-supplied-args args (plist-get options :args))) + + (concat (format org-R-skeleton-funcall-1-arg + "barplot(as.matrix" matrix-index + (concat "), " (org-R-plist-to-R-args args))) + "; legend(" (org-R-plist-to-R-args largs) ")"))) + + ;;---------------------------------------------------------------------- + + ((eq action 'density) + (if (and nxcols (> nxcols 1)) + (error "Multiple columns not implemented for action:%s" action)) + + (setq args (plist-put args :xlab (concat "colnames(x)["xcols-R"]"))) + (setq args (org-R-set-user-supplied-args args (plist-get options :args))) + + (format org-R-skeleton-funcall-1-arg + "plot(density" matrix-index + (concat "), " (org-R-plist-to-R-args args)))) + + ;;---------------------------------------------------------------------- + + ((eq action 'hist) + (if (and nxcols (> nxcols 1)) + (error "Multiple columns not implemented for action:%s" action)) + (setq args (plist-put args :xlab (concat "colnames(x)["xcols-R"]"))) + (setq args (org-R-set-user-supplied-args args (plist-get options :args))) + (setq args (concat ", " (org-R-plist-to-R-args args))) + (format org-R-skeleton-funcall-1-arg "hist" matrix-index args)) + + ;;---------------------------------------------------------------------- + + ((eq action 'image) + (format org-R-skeleton-funcall-1-arg "image(as.matrix" matrix-index ")")) + + ;;---------------------------------------------------------------------- + + ((eq action 'plot) + (setq seq (concat "seq_along("xcols-R")")) + + (setq args (plist-put args :type (if (plist-get options :lines) "\"l\"" "\"p\""))) + (setq args (plist-put args :ylab (concat "colnames(x)["xcols-R"]"))) + (setq args (concat ", " (org-R-plist-to-R-args args))) + + (concat (format org-R-skeleton-funcall-1-arg + (if (eq nxcols 1) "plot" "matplot") matrix-index args) + extra-code)) + + ;;---------------------------------------------------------------------- + + ((eq action 'tabulate) + (concat + (if (plist-get options :sort) + (format org-R-skeleton-funcall-1-arg + "x <- sort(table" xcols-R "), decreasing=TRUE") + (format org-R-skeleton-funcall-1-arg "x <- table" matrix-index "")) + (if (eq nxcols 1) "; x <- data.frame(value=names(x), count=x[])"))) + + ;;---------------------------------------------------------------------- + + ((eq action 'transpose) + (format org-R-skeleton-funcall-1-arg "x <- t" matrix-index "")) + + ;;---------------------------------------------------------------------- + + ;; Don't recognise action: option, try applying it as the name of an R function. + + (t (format org-R-skeleton-funcall-1-arg + (concat "x <- " (symbol-name action)) matrix-index "")))) + + ;;---------------------------------------------------------------------- + + (ycols-R + ;; x and y columns specified + (cond + + ;;---------------------------------------------------------------------- + + ((eq action 'plot) + (unless (eq nxcols 1) (error "Multiple x-columns not implemented for action:plot")) + + (setq args + (plist-put + args :ylab + (concat "if(length("ycols-R") == 1) colnames(x)["ycols-R"] else ''"))) + (setq args (plist-put args :xlab (concat "colnames(x)["xcols-R"]"))) + + (setq args (plist-put args :type (if (plist-get options :lines) "\"l\"" "\"p\""))) + + (setq args (concat ", " (org-R-plist-to-R-args args))) + (setq seq (concat "seq_along("ycols-R")")) + + (setq largs (plist-put largs :col seq)) + (setq largs (plist-put largs :lty seq)) + (setq largs (plist-put largs :bty "\"n\"")) + (setq largs (plist-put largs :legend (concat "colnames(x)["ycols-R"]"))) + + (setq extra-code + (concat "; " + "if(length("ycols-R") > 1) " + "legend(" (org-R-plist-to-R-args largs) ")")) + + (concat (format org-R-skeleton-funcall-2-args + (if (and (eq nxcols 1) (eq nycols 1)) "plot" "matplot") + xcols-R ycols-R args) + extra-code)) + + ;;---------------------------------------------------------------------- + + (t (error "action:%s requires a single set of columns" (symbol-name action)))))))) + +(defun org-R-set-user-supplied-args (args user-args) + "Set user-supplied values in arguments plist." + (while (setq prop (pop user-args)) + (setq args (plist-put args prop (pop user-args)))) + args) + +(defun org-R-plist-to-R-args (plist) + "Convert a plist into a string of R arguments." + (let (arg-string arg) + (while (setq arg (pop plist)) + (string-match ":\\(\.*\\)" (symbol-name arg)) + (setq arg (match-string 1 (symbol-name arg))) + (setq arg-string + (concat + (if arg-string (concat arg-string ", ")) + (format "%s=%s" arg (pop plist))))) + arg-string)) + +(defun org-R-alist-to-R-args (alist) + "Convert an alist of (argument . val) pairs into a string of R arguments. +The alist is something like + '((arg1 . 1) + (arg2 . a)) +This isn't used, but it seems much nicer than +my plist equivalent. Is there a better way to write the plist +version? +" + (mapconcat + 'identity + (mapcar (lambda(pair) (format "%s = %s" (car pair) (cdr pair))) alist) + ", ")) + +(defun org-R-make-index-vectors (cols) + "Construct R indexing vectors as strings from lisp form. + +COLS is the lisp form given by the `columns:' option. It may +take the following forms: + +1. integer atom - the number of the column +2. symbol/string atom - the name of the column +3. list of length 1 - same as 1 or 2 above +4. list of length > 1 - specification of multiple columns as 1 or 2 above, unless it is +5. list of 2 lists - each list specifies (possibly multiple) columns + +In cases 1-4 this function returns a list of length 1, containing +the R index vector as a string. In case 5 this function returns a +list of two such index vectors. + +In cases 1 - 4, when a bivariate plot is requested such as by +`action:lines', the x values are implicit, i.e +1,2,...,number-of-rows. + +In case 4, an attempt is made to do something sensible with the +multiple columns, e.g. for `action:lines' they will be plotted +together on the same graph against the implicit x values, and for +`action:barplot' the bars corresponding to a single row will be +stacked on top of each other, or placed side by side, depending +on the value of the `beside' option. + +For `action:tabulate', if 2 columns are selected, a +two-dimensional table is created. If more than 2, then the +appropriately dimensioned table is computed and inserted using +the standard text representation of multi-dimensional arrays used +by R (as org does not currently have tables of dimension > 2). + +The straightforward case of case 5 is that both lists are of +length 1. For `action:plot' and `action:lines' these specify the +y and x coordinates of the points to be plotted or joined by +lines. + +The intention is that `org-R-apply' does something +corresponding to what would happen if you did the following in R: + +fun(x=tab[,xcols], y=tab[,ycols]) + +where fun is the R function implementing the desired +action (plotting/computation), tab is the org table, xcols are +the columns specified in cases 1-4 above, and ycols are the +second set of columns which might have been specified under case +5 above. For relevant R documentation see the help page +associated with the function xy.coords, e.g. by typing ?xy.coords +at the R prompt. + +The following won't work with case 5: `tabulate' +" + (defun org-R-make-index-vector (cols) + "Return the R indexing vector (as a string) corresponding to +the lisp form COLS. In this function, COLS is a either a list of +atoms, or an atom, i.e. in the form of cases 1-4" + (when cols + (let (to-stringf) + (unless (listp cols) (setq cols (list cols))) + (setq to-stringf + (cond ((car (mapcar 'symbolp cols)) + (lambda (symbol) (concat "\"" (symbol-name symbol) "\""))) + ((car (mapcar 'integerp cols)) + 'int-to-string) + ((car (mapcar 'stringp cols)) + (lambda (string) (concat "\"" string "\""))) + (t (error "Column selection should be symbol, integer or string: %S" cols)))) + (concat (when (> (length cols) 1) "c(") + (mapconcat to-stringf cols ",") + (when (> (length cols) 1) ")"))))) + + (if (and (listp cols) (listp (car cols))) + (mapcar 'org-R-make-index-vector cols) ;; case 5 + (list (org-R-make-index-vector cols)))) ;; other cases + +(defun org-R-number-of-columns (cols) + (defun f (c) (if (listp c) (length c) 1)) + (if (and (listp cols) (listp (car cols))) + (mapcar 'f cols) + (list (f cols)))) + +(defun org-R-eval (R-function csv-file options) + "Apply an R function to tabular data and receive output as an org table. + +R-FUNCTION is a string; it may be simply the name of an +appropriate R function (e.g. \"summary\", \"plot\"), or a +user-defined anonymous function of the form +\"(function(data.frame) {...})\". It will receive as its first +argument the org table as an R 'data frame' -- a table-like +structure which can have columns containing different types of +data -- numeric, character etc. + +The R function may produce graphical and/or text output. If it +produces text output, and the replace:t is specified, and if +there is a table immediately above the #+R lines, then it is +replaced by the text output. Otherwise the text output is +inserted above the #+R lines. +" + (let ((transit-buffer "org-R-transit") + (infile (plist-get options :infile)) + (output-file (plist-get options :outfile)) + (title (plist-get options :title)) + output-format graphics-output-file width height) + + (unless (not output-file) + ;; We are writing output to file. Determine file format and + ;; location, and open graphics device if necessary. + (if (string-match + "\\(.*\.\\)?\\(org\\|png\\|jpg\\|jpeg\\|pdf\\|ps\\|bmp\\|tiff\\)$" + output-file) + (setq output-format (match-string 2 output-file)) + (error "Did not recognise file name suffix %s as available output format" + (match-string 2 output-file))) + (unless (match-string 1 output-file) + ;; only suffix provided: store in org-attach dir + (require 'org-attach) + (let ((temporary-file-directory (org-attach-dir t))) + (setq output-file + (make-temp-file + "org-R-output-" nil (concat "." output-format))))) + (if (eq output-format "jpg") (setq output-format "jpeg")) + (setq graphics-output-file (not (string-equal output-format "org"))) + (if graphics-output-file ;; open the graphics device + (ess-execute + (concat output-format "(file=\"" output-file "\"" + (if (setq width (plist-get options :width)) + (format ", width=%d" width)) + (if (setq height (plist-get options :height)) + (format ", height=%d" height)) ")")))) + + ;; Apply R code to table (which is now stored as a csv file) + ;; does it matter whether this uses ess-command or ess-execute? + + ;; First evaluate function definition for R -> org table conversion + (ess-execute (replace-regexp-in-string "\n" " " org-R-write-org-table-def) + nil transit-buffer) + + ;; FIXME: why not eval the function def together with the function call + ;; as in the commented out line below (it didn't work for some reason) + (ess-execute + (concat + ;; (replace-regexp-in-string "\n" " " org-R-write-org-table-def) ";" + (org-R-make-expr R-function csv-file options)) nil transit-buffer) + + (save-excursion + (set-buffer (concat "*" transit-buffer "*")) + (unless (or (looking-at "$") + (string-equal (buffer-substring-no-properties 1 2) "|")) + (error "Error in R evaluation:\n%s" (buffer-string)))) + + + (if csv-file + (unless (and infile + (string-equal (file-name-extension infile) "csv")) + (delete-file csv-file))) + + (if graphics-output-file (ess-execute "dev.off()")) ;; Close graphics device + + (unless (or graphics-output-file + (not (plist-get options :output-to-buffer))) + ;; Send tabular output to a org buffer as new org + ;; table. Recall that we are currently at the beginning of the + ;; first #+R line + (if (and output-file graphics-output-file) + (error "output-to-buffer and graphics-output-file both t")) + + (save-excursion + (if output-file + (progn (set-buffer (find-file-noselect output-file)) + (delete-region (point-min) (point-max))) + (if (plist-get options :replace) + (progn ;; kill a table iff in one or one ends on the previous line + (delete-region (org-table-begin) (org-table-end)) + (save-excursion + (forward-line -1) + (if (looking-at "#\\+TBLNAME") + (delete-region (point) (1+ (point-at-eol)))))))) + (if title (insert "#+TBLNAME:" title "\n")) + (insert-buffer-substring (concat "*" transit-buffer "*")) + (org-table-align) + (if output-file (save-buffer)))) + + ;; We might be linking to graphical output, or to org output in + ;; another file. Either way, point is still at the beginning of + ;; the first #+R line. + (unless (not output-file) + (save-excursion + (forward-line -1) + (if (looking-at "\\[\\[file:") + (delete-region (point) (1+ (point-at-eol))))) + (insert (org-make-link-string + (concat "file:" output-file) + (unless (plist-get options :inline) + (or title (concat output-format " output")))) "\n")) + + (kill-buffer (concat "*" transit-buffer "*")))) + + +(defun org-R-export-to-csv (csv-file options) + "Find and export org table to csv. + +If the intable: option has not been supplied, then the table must +end on the line immediately above the #+R lines. Otherwise, +the remote table referenced by the intable: option is found using +org-R-find-table. If options:infile has been set then this is the +org file containing the table. See the docstring of +org-R-find-table for details." + (let ((tbl-name-or-id (plist-get options :intable)) + (org-file (plist-get options :infile)) tbl-marker) + + (if (and org-file + (not (string-equal (file-name-extension org-file) "org"))) + (error "File %s extension is not .csv so should be .org")) + + (save-excursion + (if tbl-name-or-id + ;; a remote table has been specified -- move into it + (progn + (if org-file (set-buffer (find-file-noselect org-file))) + (setq tbl-marker (org-R-find-table tbl-name-or-id 'marker)) + (set-buffer (marker-buffer tbl-marker)) + (goto-char (marker-position tbl-marker))) + (forward-line -1)) ;; move into table above + (if (looking-at "[ \t]*|") + (progn (org-table-export csv-file "orgtbl-to-csv") csv-file) + nil)))) + +(defun org-R-find-table (name-or-id &optional markerp) + "Return location of a table. + +NAME-OR-ID may be the name of a +table in the current file as set by a \"#+TBLNAME:\" directive. +The first table following this line will then be used. +Alternatively, it may be an ID referring to any entry, perhaps in +a different file. In this case, the first table in that entry +will be referenced. The location is returned as a marker pointing +to the beginning of the first line of the table. + +This is taken from the first part of org-table-get-remote-range +in org-table.el. +" + (cond + ((symbolp name-or-id) (setq name-or-id (symbol-name name-or-id))) + ((numberp name-or-id) (setq name-or-id (number-to-string name-or-id)))) + (save-match-data + (let ((id-loc nil) (case-fold-search t) buffer loc) + (save-excursion + (save-restriction + (widen) + (save-excursion + (goto-char (point-min)) + (if (re-search-forward + (concat "^#\\+TBLNAME:[ \t]*" (regexp-quote name-or-id) "[ \t]*$") + nil t) + ;; OK, we've found a matching table name in this buffer. + (setq buffer (current-buffer) loc (match-beginning 0)) + ;; It's not a table name in this buffer. It must be an entry id. + ;; obtain a marker pointing to it. + (setq id-loc (org-id-find name-or-id 'marker) + buffer (marker-buffer id-loc) + loc (marker-position id-loc)) + (move-marker id-loc nil))) ;; disable the marker + ;; (switch-to-buffer buffer) + (set-buffer buffer) + ;; OK, so now we're in the right buffer, and loc is either + ;; the beginning of the #+TBLNAME line, or the location of the entry + ;; either way we need to search forward to get to the beginning of the table + (save-excursion + (save-restriction + (widen) + (goto-char loc) + (forward-char 1) + ;; The following regexp search finds the beginning of + ;; the next table in this entry. If it gets to the next + ;; entry before the next table, then it signals failure. + (unless (and (re-search-forward "^\\(\\*+ \\)\\|[ \t]*|" nil t) + (not (match-beginning 1))) + (error "Cannot find a table at NAME or ID %s" name-or-id)) + (if markerp + (move-marker (make-marker) (point-at-bol) (current-buffer)) + (error "Option to return cons cell not implemented. + It should return (file-name . position) to be + consistent with functions in org-id.el"))))))))) + +(defun org-R-make-expr (R-function csv-file options) + "Construct R code to read data, analyse it and write output." + + (let ((rownames (plist-get options :rownames)) + (colnames (plist-get options :colnames)) + (action (plist-get options :action)) + (replace (plist-get options :replace))) + + (if (and csv-file (symbolp csv-file)) + (setq csv-file (symbol-name csv-file))) + + (format "write.org.table((%s)(%s), write.rownames=%s)" + R-function + (if csv-file + (format + "read.csv(\"%s\", header=%s, row.names=%s)" + csv-file + + ;; Do we treat first row as colnames? Yes by default + ;; FIXME: should really check for hline + (if colnames "TRUE" "FALSE") + + ;; Do we use a column as rownames? Not unless rownames: is specified + (if rownames "1" "NULL")) + "NULL") + + ;; Do we write rownames into org table? + (cond ((eq action 'tabulate) + (if (eq (plist-get options :nxcols) 1) "FALSE" "TRUE")) + ((eq action 'transpose) (if colnames "TRUE" "FALSE")) + (rownames "TRUE") + (t "TRUE"))))) + +(defun org-R-get-options () + "Parse the #+R: lines and return the options and values as a p-list." + (let ((opts '( + (:infile . "infile") + (:intable . "intable") + (:rownames . "rownames") + (:colnames . "colnames") + (:columns . "columns") + + (:action . "action") + (:args . "args") + + (:outfile . "outfile") + (:replace . "replace") + (:title . "title") + (:legend . "legend") + (:colour . "colour") + (:color . "color") + (:col . "col") + (:height . "height") + (:width . "width") + (:lines . "lines") + (:sort . "sort") + (:inline . "inline") + + (:output-to-buffer . "output-to-buffer") + + (:showcode . "showcode"))) + (regexp ":\\(\"[^\"]*\"\\|(([^)]*) *([^)]*))\\|([^)]*)\\|[^ \t\n\r;,.]*\\)") + (case-fold-search t) p) + + ;; FIXME: set default options properly + (setq p (plist-put p :output-to-buffer t)) ;; FIXME: hack: null options plist is bad news + (setq p (plist-put p :replace t)) + (setq p (plist-put p :rownames nil)) + (setq p (plist-put p :colnames t)) + (setq p (plist-put p :inline nil)) + + (save-excursion + (while (looking-at "^#\\+\\(RR?:+\\) *\\(.*\\)") + (if (string= "R:" (match-string 1)) + (setq p (org-R-add-options-to-plist p (match-string 2) opts regexp))) + (forward-line))) + p)) + +(defun org-R-add-options-to-plist (p opt-string op regexp) + "Parse a #+R: line and set values in the property list p. +This function is adapted from similar functions in org-exp.el +and org-plot.el. It might be a good idea to have a single +function serving these three files' needs." + ;; Adapted from org-exp.el and org-plot.el + (let (o) + (when opt-string + (while (setq o (pop op)) + (if (string-match + (concat (regexp-quote (cdr o)) regexp) + opt-string) + (setq p (plist-put p (car o) + (car (read-from-string + (match-string 1 opt-string))))))))) + p) + + +(defun org-R-sanitise-options (options) + (error "not used yet") + (let (should-be-strings '(title legend colour color col csv))) + ) +(defun org-R-showcode (R) + "Display R function constructed by org-R in a new R-mode +buffer." + (split-window-vertically) + (switch-to-buffer "*org-table.R*") + (kill-region (point-min) (point-max)) + (R-mode) + (insert (replace-regexp-in-string + ";" "\n" (replace-regexp-in-string "\\([{}]\\)" "\n\\1\n" R))) + ;; (mark-whole-buffer) + ;; (indent-region) + ;; why doesn't that do what I hoped? + ) + +(defun org-R-get-remote-range (name-or-id form) + "Get a field value or a list of values in a range from table at ID. + +This is a refactoring of Carsten's original version. I have +extracted the first bit of his function and named it +org-R-find-table (which would presumably be called something like +org-table-find-table or org-id-find-table if this were accepted). + +--- + +Get a field value or a list of values in a range from table at ID. + +NAME-OR-ID may be the name of a table in the current file as set by +a \"#+TBLNAME:\" directive. The first table following this line +will then be used. Alternatively, it may be an ID referring to +any entry, possibly in a different file. In this case, the first table +in that entry will be referenced. +FORM is a field or range descriptor like \"@2$3\" or or \"B3\" or +\"@I$2..@II$2\". All the references must be absolute, not relative. + +The return value is either a single string for a single field, or a +list of the fields in the rectangle." + + (let ((tbl-marker (org-R-find-table name-or-id 'marker)) + org-table-column-names org-table-column-name-regexp + org-table-local-parameters org-table-named-field-locations + org-table-current-line-types org-table-current-begin-line + org-table-current-begin-pos org-table-dlines + org-table-hlines org-table-last-alignment + org-table-last-column-widths org-table-last-alignment + org-table-last-column-widths tbeg) + + (save-excursion + (set-buffer (marker-buffer tbl-marker)) + (goto-char (marker-position tbl-marker)) + (org-table-get-specials) + (setq form (org-table-formula-substitute-names form)) + (if (and (string-match org-table-range-regexp form) + (> (length (match-string 0 form)) 1)) + (save-match-data + (org-table-get-range (match-string 0 form) (point) 1)) + form)))) + +(provide 'org-R) diff --git a/lisp/ChangeLog b/lisp/ChangeLog index e72150a..d9f730b 100755 --- a/lisp/ChangeLog +++ b/lisp/ChangeLog @@ -1,4 +1,4 @@ -2009-02-18 Carsten Dominik <carsten.dominik@gmail.com> + * org.el (org-modules): Add an entry for org-R.el. * org-agenda.el (org-agenda-todo-ignore-with-date) (org-agenda-todo-ignore-scheduled) diff --git a/lisp/org.el b/lisp/org.el index 5d7f742..842c6d8 100644 --- a/lisp/org.el +++ b/lisp/org.el @@ -193,6 +193,7 @@ to add the symbol `xyz', and the package must have a call to (const :tag "C man: Support for links to manpages in Org-mode" org-man) (const :tag "C mtags: Support for muse-like tags" org-mtags) (const :tag "C panel: Simple routines for us with bad memory" org-panel) + (const :tag "C R: Computation using the R language" org-R) (const :tag "C registry: A registry for Org links" org-registry) (const :tag "C org2rem: Convert org appointments into reminders" org2rem) (const :tag "C screen: Visit screen sessions through Org-mode links" org-screen) |