emacs.d/elpa/racket-mode-20200411.1959/racket/commands/check-syntax.rkt

#lang racket/base

(require (for-syntax racket/base)
         racket/format
         (only-in racket/list remove-duplicates)
         racket/match
         racket/set
         racket/class
         drracket/check-syntax
         (only-in version/utils version<=?)
         "../imports.rkt"
         "../syntax.rkt"
         "../util.rkt")

(provide check-syntax)

(module+ test
  (require rackunit))

;; Our front-end issues check-syntax requests after the user edits a
;; buffer, plus a short idle delay (e.g. 1 second).
;;
;; On complex inputs it can take many seconds to expand and analyze.
;; (By far mostly the expansion; although we do cache expanded syntax,
;; that doesn't always help.)
;;
;; As a result, we might be called to do a path-str for which a
;; previous command thread is still running. Although that will work
;; _correctly_, eventually, it is wasteful -- both here in the
;; back-end (calculating) and in the front-end (updating buffer
;; properties).
;;
;; Instead: We'd like to kill the old command thread and inform our
;; front-end that the old command was "canceled". We can do so here
;; simply by `break-threading`ing the thread already running the
;; command for the same file.
;;
;; How/why this works: See how command-server.rkt handles exn:break by
;; returning a `(break)` response, and, how racket-cmd.el handles that
;; by doing nothing (except cleaning up its nonce->callback
;; hash-table).

(define check-syntax
  (let ([sema (make-semaphore 1)] ;guard concurrent use of ht
        [ht   (make-hash)])       ;path-str -> thread
    (λ (path-str code-str)
      (dynamic-wind
        (λ () (call-with-semaphore
               sema
               (λ ()
                 (define (break-thread/log thd)
                   (log-racket-mode-info "cancel ~v" thd)
                   (break-thread thd))
                 (cond [(hash-ref ht path-str #f) => break-thread/log])
                 (hash-set! ht path-str (current-thread)))))
        (λ () (do-check-syntax path-str code-str))
        (λ () (call-with-semaphore
               sema
               (λ ()
                 (hash-remove! ht path-str))))))))

;; Note: Instead of using the `show-content` wrapper, we give already
;; fully expanded syntax directly to `make-traversal`. Why? Expansion
;; can be slow. 1. We need exp stx for other purposes here. Dumb to
;; expand twice. 2. We might not even need to expand once, now:
;; string->expanded-syntax maintains a cache.
;;
;; [One nuance of caching expanded syntax is that we also cache the
;; namespace used while expanding -- that needs to be the
;; current-namespace for things like module->imports. Likewise
;; current-load-relative-directory. That is why
;; string->expanded-syntax uses a "call-with" "continuation style": it
;; sets parameters when calling the continuation function.]

(define (do-check-syntax path-str code-str)
  (define path (string->path path-str))
  (parameterize ([error-display-handler (our-error-display-handler path-str code-str)]
                 [pre-exn-errors '()])
    (with-handlers ([exn:fail? (handle-fail path-str code-str)])
      (with-time/log (~a "total " path-str)
        (string->expanded-syntax path
                                 code-str
                                 (analyze path code-str))))))

(define ((analyze path code-str) stx)
  (define o (new annotations-collector%
                 [src      path]
                 [code-str code-str]))
  (parameterize ([current-annotations o])
    (define-values (expanded-expression expansion-completed)
      (make-traversal (current-namespace)
                      (current-load-relative-directory)))
    (with-time/log 'drracket/check-syntax/expanded-expression
      (expanded-expression stx))
    (with-time/log 'drracket/check-syntax/expansion-completed
      (expansion-completed)))

  (define annotations (send o get-annotations))

  (define completions-set (send o get-locals))
  (with-time/log 'imports
    (imports stx completions-set))
  (define completions (sort (set->list completions-set)
                            string<=?))
  (list 'check-syntax-ok
        (cons 'completions completions)
        (cons 'annotations annotations)))

(define annotations-collector%
  (class (annotations-mixin object%)
    (init-field src code-str)

    (define infos (mutable-set))
    (define ht-defs/uses (make-hash))
    (define locals (mutable-set))

    ;; Give infos all a common prefix so we can sort.
    (define (item sym beg end . more)
      (list* sym (add1 beg) (add1 end) more))

    ;; I've seen drracket/check-syntax return bogus positions for e.g.
    ;; add-mouse-over-status so here's some validation.
    (define code-len (string-length code-str))
    (define (valid-pos? pos) (and (<= 0 pos) (< pos code-len)))
    (define (valid-beg/end? beg end)
      (and (< beg end) (valid-pos? beg) (valid-pos? end)))

    (define/override (syncheck:find-source-object stx)
      (and (equal? src (syntax-source stx))
           src))

    #;(define/override (syncheck:add-tail-arrow _from-text _from-pos _to-text to-pos) (void))

    (define/override (syncheck:add-arrow/name-dup/pxpy
                      _def-text def-beg def-end _def-px _def-py
                      _use-text use-beg use-end _use-px _use-py
                      _actual? _level require-arrow? _name-dup?)
      ;; Consolidate the add-arrow/name-dup items into a hash table
      ;; with one item per definition. The key is the definition position.
      ;; The value is the set of its uses' positions.
      (hash-update! ht-defs/uses
                    (list (substring code-str def-beg def-end)
                          (match require-arrow?
                            ['module-lang 'module-lang]
                            [#t           'import]
                            [#f           'local])
                          (add1 def-beg)
                          (add1 def-end))
                    (λ (v) (set-add v (list (add1 use-beg)
                                            (add1 use-end))))
                    (set)))

    (define/override (syncheck:add-mouse-over-status _text beg end status)
      (when (valid-beg/end? beg end)
        ;; Avoid silly "imported from “\"file.rkt\"”"
        (define cleansed (regexp-replace* #px"[“””]" status ""))
        (set-add! infos (item 'info beg end
                              cleansed))

        ;; Local completions candidates. When a definition isn't yet
        ;; used, there will be no syncheck:add-arrow annotation
        ;; because drracket doesn't need to draw an arrow from
        ;; something to nothing. There _will_ however be a "no bound
        ;; occurrences" mouseover. Although it's hacky to match on a
        ;; string like that, it's the best way to get _all_ local
        ;; completion candidates. It's the same reason why we go to
        ;; the work in imported-completions to find _everything_
        ;; imported that _could_ be used.
        (when (or (equal? status "no bound occurrences")
                  (regexp-match? #px"^\\d+ bound occurrences?$" status))
          (set-add! locals (substring code-str beg end)))))

    #;(define/override (syncheck:add-background-color _text start fin color) (void))

    (define/override (syncheck:add-jump-to-definition text beg end id-sym path submods)
      ;; - drracket/check-syntax only reports the file, not the
      ;;   position within. We can find that using our
      ;;   def-in-file.
      ;;
      ;; - drracket/check-syntax uses identifier-binding which
      ;;   isn't smart about contracting and/or renaming
      ;;   provides. As a result, the value of the id here can
      ;;   be wrong. e.g. For "make-traversal" it will report
      ;;   "provide/contract-id-make-traversal.1". It's good to
      ;;   try both ids with def-in-file.
      ;;
      ;; However, calling def-in-file here/now for all jumps
      ;; would be quite slow. Futhermore, a user might not
      ;; actually use the jumps -- maybe not any, probably not
      ;; most, certainly not all.
      ;;
      ;; Sound like a job for a thunk, e.g. racket/promise
      ;; delay/force? We can't marshal a promise between Racket
      ;; back end and Emacs front end. We can do the moral
      ;; equivalent: Simply return the info that the front end
      ;; should give to the "def/drr" command if/as/when needed.
      (when (file-exists? path)
        (define drracket-id-str (symbol->string id-sym))
        (set-add! infos
                  (item 'external-def beg end
                        (path->string path)
                        submods
                        (if (equal? drracket-id-str text)
                            (list drracket-id-str)
                            (list drracket-id-str text))))))

    #;(define/override (syncheck:add-definition-target _text start-pos end-pos id mods) (void))
    #;(define/override (syncheck:add-require-open-menu _text start-pos end-pos file) (void))

    (define/override (syncheck:add-docs-menu _text beg end _sym _label path _anchor anchor-text)
      (set-add! infos (item 'doc beg end
                            (path->string path)
                            anchor-text)))

    #;(define/override (syncheck:add-id-set to-be-renamed/poss dup-name?) (void))

    (define/override (syncheck:add-unused-require _req-src beg end)
      (set-add! infos (item 'unused-require beg end)))

    (define/public (get-annotations)
      ;; Convert ht-defs/uses to a list of defs, each of whose uses
      ;; are sorted by positions.
      (define defs/uses
        (with-time/log 'defs/uses
          (for/list ([(def uses) (in-hash ht-defs/uses)])
            (match-define (list sym req def-beg def-end) def)
            (list 'def/uses
                  def-beg def-end
                  req sym
                  (sort (set->list uses) < #:key car)))))
      ;; annotations = infos + defs/uses, converted to a list sorted
      ;; by positions.
      (sort (append (set->list infos)
                    defs/uses)
            < #:key cadr))

    (define/public (get-locals)
      locals)

    (super-new)))

;; Typed Racket can report multiple errors. The protocol: it calls
;; error-display-handler for each one. There is a final, actual
;; exn:fail:syntax raised, but it's not useful for us: Although its
;; srclocs correspond to the locations, its message is just a summary.
;; Here we collect each message and location in a parameter, and when
;; the final summary exn is raised, we ignore it and use these. Note
;; that Typed Racket is the only such example I'm aware of, but if
;; something else wanted to report multiple errors, and it used a
;; similar approach, we'd handle it here, too.
(define pre-exn-errors (make-parameter '()))
(define ((our-error-display-handler path-str code-str) msg exn)
  (when (and (exn:fail:syntax? exn)
             (exn:srclocs? exn))
    (pre-exn-errors (append (pre-exn-errors)
                            (exn->errors path-str code-str exn)))))

(define ((handle-fail path-str code-str) e)
  (cons
   'check-syntax-errors
   (cond
     ;; Multiple errors. See comment above.
     [(not (null? (pre-exn-errors)))
      (pre-exn-errors)]
     ;; The intended use of exn:srclocs is a _single_ error, with zero
     ;; or more locations from least to most specific -- not multiple
     ;; errors.
     [(exn:srclocs? e)
      (exn->errors path-str code-str e)]
     ;; A single error with no srcloc at all. Although probably
     ;; unlikely with exn:fail:syntax during expansion (as opposed to
     ;; runtime errors) do handle it:
     [else
      (default-errors path-str code-str e)])))

(define (exn->errors path-str code-str e)
  (define (->path-string v)
    (match v
      [(? path-string? v) v]
      [(? path? v)        (path->string v)]))
  (match ((exn:srclocs-accessor e) e)
    [(list)
     (match e
       ;; exn:fail:syntax and exn:fail:read can have empty srclocs
       ;; list -- but additional struct member has list of syntaxes
       ;; from least to most specific. Use the most-specific, only.
       [(or (exn:fail:syntax msg _marks (list _ ... stx))
            (exn:fail:read   msg _marks (list _ ... stx)))
        #:when (not (exn:fail:read:eof? e))
        (define pos  (syntax-position stx))
        (define span (syntax-span stx))
        (cond [(and pos span)
               (list
                (list 'error
                      (->path-string (or (syntax-source stx) path-str))
                      pos
                      (+ pos span)
                      msg))]
              [else (default-errors path-str code-str e)])]
       [_ (default-errors path-str code-str e)])]
    [(list _ ... (? srcloc? most-specific))
     (match-define (srcloc path _ _ pos span) most-specific)
     (list
      (list 'error
            (->path-string path)
            pos
            (+ pos span)
            (exn-message e)))]
    [_ (default-errors path-str code-str e)]))

(define (default-errors path-str code-str e)
  ;; As a fallback, here, we extract position from the exn-message.
  ;; Unfortunately that's line:col and we need to return beg:end.
  (define pos (exn-message->pos code-str (exn-message e)))
  (list
   (list 'error
         path-str
         pos
         (add1 pos)
         (exn-message e))))

(define (exn-message->pos code-str msg)
  (match msg
    [(pregexp "^.+?:(\\d+)[:.](\\d+): "
              (list _ (app string->number line) (app string->number col)))
     (define in (open-input-string code-str))
     (port-count-lines! in)
     (let loop ([n 1])
       (cond [(= n line)                   (+ 1 (file-position in) col)]
             [(eof-object? (read-line in)) 1]
             [else                         (loop (add1 n))]))]
    [_ 1]))

(module+ test
  (check-equal?
   (exn-message->pos "12\n4567\n9"
                     ;      ^
                     "/path/to/foo.rkt:2:2: some problem")
   6)
  (check-equal?
   (exn-message->pos "012\n4567\n9"
                     ;       ^
                     "/path/to/foo.rkt:999:2: some problem")
   1))

(module+ example
  (require racket/file)
  (define (check-file path)
    (time (do-check-syntax path (file->string path))))
  (check-file (path->string (syntax-source #'here))))

(module+ test
  (require racket/file)
  (define (check-this-file path)
    (check-not-exn
     (λ ()
       (time (void (do-check-syntax path (file->string path)))))))
  (check-this-file (path->string (syntax-source #'here)))
  ;; Again to exercise and test cache
  (check-this-file (path->string (syntax-source #'here))))