
;;; ob-ein.el --- org-babel functions for template evaluation  -*- lexical-binding: t -*-
;; Copyright (C) John M. Miller
;; Author: John M. Miller <millejoh at mac.com>
;;; License:
;; This file is NOT part of GNU Emacs.
;; ob-ein.el is free software: you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.
;; ob-ein.el is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with ob-ein.el. If not, see <http://www.gnu.org/licenses/>.
;;; Commentary:
;; Support executing org-babel source blocks using EIN worksheets.
;;; Credits:
;; Uses code from https://github.com/gregsexton/ob-ipython (MIT License)
;;; Code:
(require 'ob)
(require 'ein-utils)
2020-02-03 19:45:34 +01:00
(require 'anaphora)
2019-11-30 08:46:49 +01:00
(autoload 'org-element-property "org-element")
(autoload 'org-element-context "org-element")
2020-02-03 19:45:34 +01:00
(autoload 'org-id-new "org-id")
(autoload 'org-redisplay-inline-images "org")
2019-11-30 08:46:49 +01:00
(autoload 'ein:notebooklist-new-notebook-with-name "ein-notebooklist")
(autoload 'ein:notebooklist-login "ein-notebooklist")
(autoload 'ein:notebook-get-opened-notebook "ein-notebook")
(autoload 'ein:notebook-url "ein-notebook")
(autoload 'ein:notebook-open "ein-notebook")
(autoload 'ein:notebook-close "ein-notebook")
(autoload 'ein:process-url-or-port "ein-process")
(autoload 'ein:process-url-match "ein-process")
(autoload 'ein:process-refresh-processes "ein-process")
(autoload 'ein:jupyter-server-conn-info "ein-jupyter")
(autoload 'ein:jupyter-server-start "ein-jupyter")
(autoload 'ein:shared-output-get-cell "ein-shared-output")
(autoload 'ein:shared-output-eval-string "ein-shared-output")
(autoload 'ein:kernel-live-p "ein-kernel")
2020-02-03 19:45:34 +01:00
(autoload 'ein:query-singleton-ajax "ein-query")
(autoload 'ein:output-area-case-type "ein-output-area")
(autoload 'ein:log "ein-log")
2019-11-30 08:46:49 +01:00
(defvar *ob-ein-sentinel* "[....]"
  "Placeholder string replaced after async cell execution.")

(defcustom ob-ein-timeout-seconds 600
  "Maximum seconds to wait for block to finish (for synchronous operations)."
  :type 'integer
  :group 'ein)

(defcustom ob-ein-languages
  '(("ein" . python)
    ("ein-python" . python)
    ("ein-R" . R)
    ("ein-r" . R)
    ("ein-julia" . julia))
  "ob-ein has knowledge of these (ein-LANG . LANG-MODE) pairs."
  :type '(repeat (cons string symbol))
  :group 'ein)

(defcustom ob-ein-anonymous-path ".%s.ipynb"
  "Notebook path used when the session header doesn't specify an ipynb.
All interactions for a given language are prosecuted in this
throwaway notebook (%s is substituted with the language)."
  :type '(string)
  :group 'ein)
(defsubst ob-ein-anonymous-p (path)
  "Return non-nil if PATH looks like `ob-ein-anonymous-path'.  Fragile.

The template is turned into a regexp by escaping its literal dots and
replacing the %s placeholder with \".+\".  The match is unanchored, so
the value is the index where the match starts, or nil."
  (string-match (replace-regexp-in-string
                 "%s" ".+"
                 (replace-regexp-in-string "\\." "\\\\." ob-ein-anonymous-path))
                path))
(defcustom ob-ein-inline-image-directory "ein-images"
  "Store ob-ein images here."
  :group 'ein
  :type 'directory)

(defcustom ob-ein-default-header-args:ein nil
  "No documentation."
  :group 'ein
  :type '(repeat string))
(defun ob-ein--inline-image-info (value)
  "Return the image file name to use for VALUE, creating its directory.

The name is \"ob-ein-<md5 of VALUE>.png\" under
`ob-ein-inline-image-directory'; the directory (and any missing
parents) is created when it does not exist yet."
  (let* ((digest (md5 value))
         (dir ob-ein-inline-image-directory)
         (target (concat dir "/ob-ein-" digest ".png")))
    (unless (file-directory-p dir)
      (make-directory dir 'parents))
    ;; Callers use the return value as the file to write, so hand it back.
    target))
(defun ob-ein--write-base64-image (img-string file)
  "Decode the base64 text IMG-STRING and write the resulting bytes to FILE.

`base64-decode-region' signals an error if IMG-STRING is not valid
base64."
  ;; `with-temp-file' writes FILE only after its body has returned, so the
  ;; write-time coding system must be bound around it, not inside the body.
  (let ((coding-system-for-write 'binary))
    (with-temp-file file
      ;; Keep the decoded image as raw bytes.
      (set-buffer-multibyte nil)
      (insert img-string)
      (base64-decode-region (point-min) (point-max)))))
(defun ob-ein--proxy-images (json explicit-file)
  "Return the org result text for one output JSON.

For the image MIME types listed below the data is written with
`ob-ein--write-base64-image' to EXPLICIT-FILE, or when that is nil to
the file named by `ob-ein--inline-image-info', and an org file link
is returned.  For any other type the value itself is returned."
  (let (result)
    ;; `type' and `value' are not bound by this function; presumably
    ;; `ein:output-area-case-type' binds them from JSON.
    ;; NOTE(review): confirm against ein-output-area.
    (ein:output-area-case-type
     json
     (cl-case type
       ((:image/svg+xml :image/png :image/jpeg)
        (let ((file (or explicit-file (ob-ein--inline-image-info value))))
          (ob-ein--write-base64-image value file)
          (setq result (format "[[file:%s]]" file))))
       (otherwise
        (setq result value))))
    result))
(defun ob-ein--process-outputs (outputs params)
  "Convert OUTPUTS to one string, one output per line.

Each element of OUTPUTS is passed through `ob-ein--proxy-images'
together with the :image entry of PARAMS (nil when absent), and the
results are joined with newlines by `ein:join-str'."
  (let ((file (cdr (assoc :image params))))
    (ein:join-str "\n"
                  (mapcar (lambda (output)
                            (ob-ein--proxy-images output file))
                          outputs))))
(defun ob-ein--get-name-create (src-block-info)
  "Get the name of a src block or add a uuid as the name.

SRC-BLOCK-INFO is a list whose fifth element is the block's name.
When that is nil, a fresh id from `org-id-new' is inserted as a
\"#+NAME:\" line above the element at point and returned."
  (or (nth 4 src-block-info)
      (save-excursion
        (let ((el (org-element-context))
              (id (org-id-new 'none)))
          (goto-char (org-element-property :begin el))
          ;; Open a line of its own so the keyword does not run into the
          ;; element's first line.
          ;; NOTE(review): line-splitting steps follow ob-ipython; confirm.
          (back-to-indentation)
          (split-line)
          (insert (format "#+NAME: %s" id))
          id))))
(defun ob-ein--babelize-lang (lang-name lang-mode)
  "Stand-up LANG-NAME as a babelized language with LANG-MODE syntax table.
Based on ob-ipython--configure-kernel.

LANG-NAME is a string and LANG-MODE a symbol.  Registers the pair in
`org-src-lang-modes', aliases org-babel-default-header-args:LANG-NAME
to `ob-ein-default-header-args:ein', and defines
org-babel-execute:LANG-NAME."
  (add-to-list 'org-src-lang-modes `(,lang-name . ,lang-mode))
  (defvaralias (intern (concat "org-babel-default-header-args:" lang-name))
    'ob-ein-default-header-args:ein)
  (fset (intern (concat "org-babel-execute:" lang-name))
        `(lambda (body params)
           "Should get rid of accommodating org-babel-variable-assignments.
We don't test it, and finding a module named ob-LANG-MODE won't work generally,
e.g., ob-c++ is not ob-C.el."
           (require (quote ,(intern (format "ob-%s" lang-mode))) nil t)
           ;; hack because ob-ein loads independently of ein
           (custom-set-variables '(python-indent-guess-indent-offset-verbose nil))
           (let ((parser
                  (quote
                   ,(intern (format "org-babel-variable-assignments:%s" lang-mode)))))
             ;; NOTE(review): expansion and dispatch calls reconstructed
             ;; from the surviving argument lists; confirm against upstream.
             (ob-ein--execute-body
              (if (fboundp parser)
                  (org-babel-expand-body:generic
                   body params (funcall (symbol-function parser) params))
                body)
              params)))))
;; Resolve the session, language, kernelspec and block name for the source
;; block at point, insert `*ob-ein-sentinel*' as a provisional result, and
;; pass a notebook callback to `ob-ein--initiate-session'.
;; NOTE(review): this copy of the definition is incomplete -- its parentheses
;; do not balance and revision-timestamp lines are interleaved with the code.
;; Restore it from the upstream file before relying on it.
(defun ob-ein--execute-body (body params)
2019-11-30 08:46:49 +01:00
(let* ((buffer (current-buffer))
(processed-params (org-babel-process-params params))
(result-params (cdr (assq :result-params params)))
;; The :session header formatted as a string, unless it equals "none"
;; (`ein:aand' is presumably an anaphoric `and' binding `it' -- confirm).
;; NOTE(review): the fallback operand of this `or' appears to be missing.
(session (or (ein:aand (cdr (assoc :session processed-params))
(unless (string= "none" it)
(format "%s" it)))
(lang (nth 0 (org-babel-get-src-block-info)))
;; An explicit :kernelspec header wins; otherwise build (language . MODE)
;; from `org-src-lang-modes', signalling an error when LANG is not listed.
(kernelspec (or (cdr (assoc :kernelspec processed-params))
2020-02-03 19:45:34 +01:00
(aif (cdr (assoc lang org-src-lang-modes))
2019-11-30 08:46:49 +01:00
(cons 'language (format "%s" it))
(error "ob-ein--execute-body: %s not among %s"
lang (mapcar #'car org-src-lang-modes)))))
(name (ob-ein--get-name-create (org-babel-get-src-block-info)))
;; NOTE(review): only the kernel lookup survives in this lambda; presumably
;; it handed the kernel to `ob-ein--execute-async' -- confirm upstream.
(callback (lambda (notebook)
2020-02-03 19:45:34 +01:00
2019-11-30 08:46:49 +01:00
(ein:$notebook-kernel notebook)
;; The lookup must not return a string before the sentinel is inserted as
;; the provisional result.
(cl-assert (not (stringp (org-babel-goto-named-src-block name))))
(org-babel-insert-result *ob-ein-sentinel* result-params))
(ob-ein--initiate-session session kernelspec callback)
;; When `ein:eval-if-bound' yields non-nil for `org-current-export-file'
;; (presumably during export), poll every INTERVAL milliseconds, for at most
;; `ob-ein-timeout-seconds', until the sentinel is gone from the named result.
(if (ein:eval-if-bound 'org-current-export-file)
(cl-loop with interval = 2000
2020-02-03 19:45:34 +01:00
with pending = t
repeat (/ (* ob-ein-timeout-seconds 1000) interval)
do (progn
(org-babel-goto-named-result name)
(forward-line 1)
(setq pending (re-search-forward
(regexp-quote *ob-ein-sentinel*)
(org-babel-result-end) t)))
until (not pending)
do (sleep-for 0 interval)
finally return
;; A timeout logs an error and yields the empty string.
;; NOTE(review): the success branch and the rest of the function are cut off
;; after the next form.
(if pending
(prog1 ""
(ein:log 'error "ob-ein--execute-body: %s timed out" name))
(ein:oref-safe (ein:shared-output-get-cell) 'outputs)
2019-11-30 08:46:49 +01:00
(defsubst ob-ein--execute-async-callback (buffer params result-params name)
  "Callback of 1-arity (the shared output cell) to update org buffer when
`ein:shared-output-eval-string' completes.

BUFFER is the org buffer holding the source block called NAME.
PARAMS is passed to `ob-ein--process-outputs' and RESULT-PARAMS to
`org-babel-result-cond'.  The cell's traceback, when present, is
used in place of its outputs."
  ;; NOTE(review): `apply-partially', the `result' binding and the
  ;; result-insertion calls are reconstructed; confirm against upstream.
  (apply-partially
   (lambda (buffer* params* result-params* name* cell)
     (let* ((raw (aif (ein:oref-safe cell 'traceback)
                     (ansi-color-apply (ein:join-str "\n" it))
                   (ob-ein--process-outputs
                    (ein:oref-safe cell 'outputs) params*)))
            (result
             (let ((tmp-file (org-babel-temp-file "ein-")))
               ;; `with-temp-file' writes only what its body inserts, so
               ;; RAW must be inserted, not merely evaluated.
               (with-temp-file tmp-file (insert raw))
               (org-babel-result-cond result-params*
                 raw (org-babel-import-elisp-from-file tmp-file '(16)))))
            (info (org-babel-get-src-block-info 'light)))
       (ein:log 'debug "ob-ein--execute-async-callback %s \"%s\" %s" name* result buffer*)
       (with-current-buffer buffer*
         (save-excursion
           (unless (stringp (org-babel-goto-named-src-block name*)) ;; stringp=error
             (when info ;; kill #+RESULTS: (no-name)
               (setf (nth 4 info) nil)
               (org-babel-remove-result info))
             (org-babel-remove-result) ;; kill #+RESULTS: name
             (org-babel-insert-result
              result
              (cdr (assoc :result-params
                          (nth 2 (org-babel-get-src-block-info)))))
             (org-redisplay-inline-images)))))
   buffer params result-params name))
(defun ob-ein--execute-async (buffer body kernel params result-params name)
  "As `ein:shared-output-get-cell' is a singleton, ob-ein can only execute blocks
one at a time.  Further, we do not order the queued up blocks!

Wait until the shared output cell's callback slot is `ignore', install
the callback built by `ob-ein--execute-async-callback' from BUFFER,
PARAMS, RESULT-PARAMS and NAME, then evaluate BODY on KERNEL with
`ein:shared-output-eval-string'."
  ;; `deferred:$' supplies the `it' that the second step chains onto.
  (deferred:$
    (deferred:next
      (deferred:lambda ()
        (let ((cell (ein:shared-output-get-cell)))
          (if (eq (slot-value cell 'callback) #'ignore)
              (setf (slot-value cell 'callback)
                    (ob-ein--execute-async-callback buffer params
                                                    result-params name))
            ;; still pending previous callback
            (deferred:nextc (deferred:wait 1200) self)))))
    (deferred:nextc it
      (lambda (_x)
        (ein:shared-output-eval-string kernel body)))))
(defun ob-ein--parse-session (session)
  "Return the notebook URL denoted by the string SESSION.

When SESSION parses with a host it is passed to `ein:url' unchanged.
Otherwise a candidate URL is built from its \"/\"-separated tokens;
if `ein:jupyter-server-conn-info' reports a server and the candidate
carries only its scheme's default port, the first token is replaced
by that server's url-or-port."
  (cl-multiple-value-bind (url-or-port _password) (ein:jupyter-server-conn-info)
    (let ((tokens (split-string session "/"))
          (parsed-url (url-generic-parse-url session)))
      (cond ((null (url-host parsed-url))
             (let* ((candidate (apply #'ein:url (car tokens) (cdr tokens)))
                    (parsed-candidate (url-generic-parse-url candidate))
                    (missing (url-scheme-get-property
                              (url-type parsed-candidate)
                              'default-port)))
               (if (and url-or-port
                        (= (url-port parsed-candidate) missing))
                   (apply #'ein:url url-or-port (cdr tokens))
                 ;; NOTE(review): else branch reconstructed; confirm.
                 candidate)))
            (t (ein:url session))))))
;; NOTE(review): this copy of the definition is incomplete -- several forms
;; are cut short, the parentheses do not balance, and revision-timestamp
;; lines are interleaved with the code.  Restore it from the upstream file
;; before relying on it.
(defun ob-ein--initiate-session (session kernelspec callback)
2019-11-30 08:46:49 +01:00
"Retrieve notebook based on SESSION path and KERNELSPEC, starting jupyter instance
if necessary. Install CALLBACK (i.e., cell execution) upon notebook retrieval."
(let* ((nbpath (ob-ein--parse-session session))
2020-02-03 19:45:34 +01:00
(info (org-babel-get-src-block-info))
2019-11-30 08:46:49 +01:00
(anonymous-path (format ob-ein-anonymous-path (nth 0 info)))
(parsed-url (url-generic-parse-url nbpath))
(slash-path (car (url-path-and-query parsed-url)))
;; PATH is the URL path minus its leading slash, or the anonymous notebook
;; path when the URL has no path.
(path (if (string= slash-path "") anonymous-path
(substring slash-path 1)))
;; NOTE(review): the branch of this `if' for an empty path appears to be
;; missing; the surviving form strips the path suffix from NBPATH.
(url-or-port (if (string= slash-path "")
(substring nbpath 0 (- (length slash-path)))))
(notebook (ein:notebook-get-opened-notebook url-or-port path))
;; Poll up to 50 times, 300 ms apart, for a live kernel.
;; NOTE(review): the final `do' below presumably followed a `finally'
;; keyword that was dropped -- confirm upstream.
(callback-nbopen (lambda (nb _created)
(cl-loop repeat 50
2020-02-03 19:45:34 +01:00
for live-p = (ein:kernel-live-p (ein:$notebook-kernel nb))
until live-p
do (sleep-for 0 300)
do (if (not live-p)
(ein:log 'error
"Kernel for %s failed to launch"
(ein:$notebook-notebook-name nb))
(funcall callback nb)))))
2019-11-30 08:46:49 +01:00
;; NOTE(review): the function applied to these arguments on a 404 is missing.
(errback-nbopen (lambda (url-or-port status-code)
(if (eq status-code 404)
url-or-port kernelspec path callback-nbopen t))))
(callback-login (lambda (_buffer url-or-port)
(ein:notebook-open url-or-port path kernelspec
callback-nbopen errback-nbopen t))))
;; Case 1: the anonymous notebook is open and KERNELSPEC is a string.
;; NOTE(review): the other operand of the `equal' and the last argument of
;; the debug log are missing.
(cond ((and notebook
(string= path anonymous-path)
(stringp kernelspec)
(not (equal (ein:$kernelspec-name (ein:$notebook-kernelspec notebook))
(ein:log 'debug "ob-ein--initiate-session: switching %s from %s to %s"
path (ein:$kernelspec-name (ein:$notebook-kernelspec notebook))
;; Close the notebook with `y-or-n-p' stubbed to `ignore', then issue a
;; DELETE request for its URL.
(cl-letf (((symbol-function 'y-or-n-p) #'ignore))
2020-02-03 19:45:34 +01:00
(ein:notebook-close notebook))
(ein:query-singleton-ajax (ein:notebook-url notebook)
:type "DELETE")
2019-11-30 08:46:49 +01:00
;; Wait up to 8 times, 500 ms apart, for the notebook file to disappear,
;; then retry the whole session initiation.
;; NOTE(review): the call that consumed the "cannot delete" message is missing.
(cl-loop repeat 8
2020-02-03 19:45:34 +01:00
with fullpath = (concat (file-name-as-directory nbpath) path)
for extant = (file-exists-p fullpath)
until (not extant)
do (sleep-for 0 500)
finally do (if extant
(format "cannot delete path=%s nbpath=%s"
fullpath nbpath))
(ob-ein--initiate-session session kernelspec callback))))
2019-11-30 08:46:49 +01:00
;; Case 2: the notebook is already open, so run CALLBACK on it directly.
(notebook (funcall callback notebook))
;; Case 3: the URL host equals `ein:url-localhost'; log in to a matching
;; known process when there is one.
;; NOTE(review): the else branch is fragmentary; presumably it started a
;; jupyter server -- confirm upstream.
((string= (url-host parsed-url) ein:url-localhost)
2020-02-03 19:45:34 +01:00
(aif (ein:process-url-match nbpath)
2019-11-30 08:46:49 +01:00
(ein:notebooklist-login (ein:process-url-or-port it) callback-login)
2020-02-03 19:45:34 +01:00
(executable-find (or (ein:eval-if-bound 'ein:jupyter-server-command)
2019-11-30 08:46:49 +01:00
(read-directory-name "Notebook directory: " default-directory)
;; Yield nil when the URL's port is its scheme's default port, else the port.
(let* ((port (url-port parsed-url))
(avoid (url-scheme-get-property (url-type parsed-url) 'default-port)))
(cond ((= port avoid) nil)
(t (url-port parsed-url)))))))
;; Case 4: any other host; log in and open the notebook via CALLBACK-LOGIN.
(t (ein:notebooklist-login url-or-port callback-login)))))
;; Register every (ein-LANG . LANG-MODE) pair with org-babel at load time.
(cl-loop for (lang . mode) in ob-ein-languages
         do (ob-ein--babelize-lang lang mode))

;; Offer "Ein" among the customize choices of `org-babel-load-languages'.
(when (featurep 'org)
  (let* ((orig (get 'org-babel-load-languages 'custom-type))
         (orig-cdr (cdr orig))
         (choices (plist-get orig-cdr :key-type))
         (entry '(const :tag "Ein" ein)))
    ;; Skip when the choice list has an unexpected shape, or when the entry
    ;; is already there (e.g. this file was loaded twice).
    (when (and (consp choices) (not (member entry choices)))
      (push entry (nthcdr 1 choices))
      (put 'org-babel-load-languages 'custom-type
           (cons (car orig) (plist-put orig-cdr :key-type choices))))))

(provide 'ob-ein)