1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 
528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776
|
; Part of Scheme 48 1.9. See file COPYING for notices and license.
; Authors: Richard Kelsey, Jonathan Rees, Martin Gasbichler, Mike Sperber
; Optimizations are marked with +++, and may be flushed if desired.
; Entry point for compiling one expression: forwards NODE, DEPTH, FRAME and
; CONT unchanged to COMPILE and returns whatever COMPILE returns.
(define (compile-expression node depth frame cont)
  (compile node depth frame cont))
; Main dispatch for compiling a single expression.
; NODE is first run through TYPE-CHECK; the compilator registered in
; COMPILATORS under the checked node's operator id is then applied to the
; checked node together with DEPTH, FRAME and CONT.
(define (compile node depth frame cont)
  (let* ((checked (type-check node))
         (compilator (operator-table-ref compilators
                                         (node-operator-id checked))))
    (compilator checked depth frame cont)))
; Specialists
; The operator table holding one compilator per operator.  The procedure
; given to MAKE-OPERATOR-TABLE emits a trap whose message says the form is
; not valid in expression context (presumably it is the table's fallback for
; operators with no entry -- confirm against MAKE-OPERATOR-TABLE).
(define compilators
  (make-operator-table
   (lambda (node depth frame cont)
     (generate-trap depth
                    frame
                    cont
                    "not valid in expression context"
                    (schemify node)))))
; Register PROC in the COMPILATORS table under NAME and TYPE.
; PROC is called as (PROC node depth frame cont) by COMPILE.
(define (define-compilator name type proc)
  (operator-define! compilators name type proc))
;----------------------------------------------------------------
; Literal nodes: the node's form is the constant itself.
(define-compilator 'literal 'leaf
  (lambda (node depth frame cont)
    (compile-constant (node-form node) depth frame cont)))
; (QUOTE <datum>): the constant is the second element of the node's form.
(define-compilator 'quote syntax-type
  (lambda (node depth frame cont)
    (compile-constant (cadr (node-form node)) depth frame cont)))
; Deliver the constant OBJ to CONT.  #f and small integers have dedicated
; instructions; any other object is entered in FRAME with LITERAL->INDEX and
; fetched by a stack-indirect instruction through the template.
(define (compile-constant obj depth frame cont)
  (let ((load-code
         (if (eq? obj #f)
             ;; +++ hack for bootstrap from Schemes that don't
             ;; distinguish #f/()
             (instruction (enum op false))
             (if (small-integer? obj)
                 (integer-literal-instruction obj)
                 (stack-indirect-instruction
                  (template-offset frame depth)
                  (literal->index frame obj))))))
    (deliver-constant-value load-code cont)))
; True if OBJ is an exact integer whose value biased by 128 fits in a byte,
; i.e. 0 <= OBJ + 128 < BYTE-LIMIT.
(define (small-integer? obj)
  (if (and (integer? obj)
           (exact? obj))
      (let ((biased (+ obj 128)))
        (and (<= 0 biased)
             (< biased byte-limit)))
      #f))
; Build an INTEGER-LITERAL instruction for the small integer OBJ.
; PreScheme does not have signed bytes so we bias OBJ: the operand emitted
; is OBJ + 128, the same bias SMALL-INTEGER? uses for its range test.
(define (integer-literal-instruction obj)
  (instruction (enum op integer-literal)
               (+ obj 128)))
; The UNSPECIFIC primitive form: emits the UNSPECIFIC instruction (or nothing
; at all when CONT ignores values -- see DELIVER-CONSTANT-VALUE).
(define-compilator 'unspecific (proc () unspecific-type)
  (lambda (node depth frame cont)
    (deliver-constant-value (instruction (enum op unspecific))
                            cont)))
; The UNASSIGNED primitive form: emits the UNASSIGNED instruction (or nothing
; at all when CONT ignores values -- see DELIVER-CONSTANT-VALUE).
(define-compilator 'unassigned (proc () unspecific-type)
  (lambda (node depth frame cont)
    (deliver-constant-value (instruction (enum op unassigned))
                            cont)))
; Deliver SEGMENT, which loads a constant, to CONT.  When CONT ignores its
; values the load is dropped and an empty segment is delivered instead.
(define (deliver-constant-value segment cont)
  (let ((code (cond ((ignore-values-cont? cont) empty-segment)
                    (else segment))))
    (deliver-value code cont)))
;----------------------------------------------------------------
; Variable reference
; A variable reference.  A binding that is a pair denotes a lexical variable
; and is handled by COMPILE-LOCAL-NAME; anything else is fetched with the
; GLOBAL instruction, addressed by the template offset and the index that
; BINDING->INDEX assigns in FRAME.
(define-compilator 'name 'leaf
  (lambda (node depth frame cont)
    (let ((binding (name-node-binding node))
          (name (node-form node)))
      (define (global-reference)
        (let ((offset (template-offset frame depth))
              (index (binding->index frame binding name #f)))
          (instruction (enum op global)
                       (high-byte offset)
                       (low-byte offset)
                       (high-byte index)
                       (low-byte index))))
      (deliver-value
       (cond ((pair? binding)
              (compile-local-name node name binding depth))
             (else
              (global-reference)))
       cont))))
; Fetch a lexical variable.  BINDING is a list whose first element is a
; stack index; with no further elements the value is read straight from
; the stack, with exactly one further element it is read indirectly through
; the stack slot.  More elements than that is a compiler error.
(define (compile-local-name node name binding depth)
  (let ((stack-offset (index->offset (car binding) depth))
        (indirections (cdr binding)))
    (if (null? indirections)            ; in this frame
        (stack-ref-instruction stack-offset)
        (if (null? (cdr indirections))
            (stack-indirect-instruction stack-offset (car indirections))
            (assertion-violation 'compile-local-name "variable has too many indirections"
                                 name binding)))))
;----------------------------------------------------------------
; Hacked versions of the above for peephole optimization of pushes.
; This tries to compile NODE with an implicit push instruction preceding
; (if PRE?) or following (if not PRE?). The instructions with implicit
; pushes are:
; push-false
; push+stack-ref
; stack-ref+push
; push+stack-indirect
; stack-indirect+push
; This code finds the cases where literals or lexical references can be
; compiled into one of these.
; Try to compile NODE as a single instruction with a built-in push, placed
; before the operation when PRE? is true and after it otherwise.  Only
; literals, quoted constants and lexical references that need no
; unassigned check qualify; returns #f when no such instruction applies.
(define (maybe-compile-with-push node depth frame pre?)
  (cond ((literal-node? node)
         (constant-with-push (node-form node) depth frame pre?))
        ((quote-node? node)
         (constant-with-push (cadr (node-form node)) depth frame pre?))
        ((not (name-node? node))
         #f)
        (else
         (let ((binding (name-node-binding node)))
           (and (pair? binding)
                (not (node-ref node 'check-unassigned))
                (lexical-ref-with-push binding depth pre?))))))
; Constant OBJ combined with a push.  Returns the instruction, or #f when
; there is none: #f has only the push-after form (PUSH-FALSE), small
; integers have both forms, and other objects go through the template with
; PUSH+STACK-INDIRECT-INSTRUCTION.
(define (constant-with-push obj depth frame pre?)
  (cond ((eq? obj #f)
         (and (not pre?)
              (instruction (enum op push-false))))
        ((small-integer? obj)
         (let ((opcode (if pre?
                           (enum op push+integer-literal)
                           (enum op integer-literal+push))))
           ;; PreScheme does not have signed bytes so we bias OBJ
           (instruction opcode (+ obj 128))))
        (else
         (push+stack-indirect-instruction (template-offset frame depth)
                                          (literal->index frame obj)
                                          pre?))))
; Lexical reference combined with a push.  BINDING has the same shape as in
; COMPILE-LOCAL-NAME; returns #f for bindings with more than one
; indirection (and whenever the chosen instruction builder returns #f).
(define (lexical-ref-with-push binding depth pre?)
  (let ((stack-offset (index->offset (car binding) depth))
        (indirections (cdr binding)))
    (if (null? indirections)            ; in this frame
        (push+stack-ref-instruction stack-offset pre?)
        (and (null? (cdr indirections))
             (push+stack-indirect-instruction stack-offset
                                              (car indirections)
                                              pre?)))))
; PUSH+STACK-REF (PRE? true) or STACK-REF+PUSH (PRE? false) on stack slot
; INDEX.  The operand is a single byte, so #f is returned when INDEX does
; not fit below BYTE-LIMIT.
(define (push+stack-ref-instruction index pre?)
  (and (< index byte-limit)
       (let ((opcode (if pre?
                         (enum op push+stack-ref)
                         (enum op stack-ref+push))))
         (instruction opcode index))))
; PUSH+STACK-INDIRECT (PRE? true) or STACK-INDIRECT+PUSH (PRE? false).
; Both operands are single bytes, so #f is returned unless INDEX and
; INDEX-IN-STACK are both below BYTE-LIMIT.
(define (push+stack-indirect-instruction index-in-stack index pre?)
  (cond ((and (< index byte-limit)
              (< index-in-stack byte-limit))
         (let ((opcode (if pre?
                           (enum op push+stack-indirect)
                           (enum op stack-indirect+push))))
           (instruction opcode index-in-stack index)))
        (else
         #f)))
;----------------------------------------------------------------
; Assignment
; (SET! <name> <value>).  The value is compiled with a continuation named
; after the variable, then stored: into the stack slot for a lexical
; variable of the current frame, or with SET-GLOBAL! otherwise.  Assigning
; to a lexical variable that is not directly in this frame is a compiler
; error.
(define-compilator 'set! syntax-type
  (lambda (node depth frame cont)
    (let* ((form (node-form node))
           (target (cadr form))
           (name (node-form target))
           (binding (name-node-binding target)))
      (sequentially
       (compile (caddr form) depth frame (named-cont name))
       (deliver-value
        (cond ((pair? binding)
               (let ((stack-offset (index->offset (car binding) depth))
                     (indirections (cdr binding)))
                 (cond ((null? indirections) ; in this frame
                        (stack-set!-instruction stack-offset))
                       (else
                        (assertion-violation 'set! "SET! on a closed-over variable" name)))))
              (else
               (let ((offset (template-offset frame depth))
                     (index (binding->index frame
                                            binding
                                            name
                                            #t)))
                 (instruction (enum op set-global!)
                              (high-byte offset)
                              (low-byte offset)
                              (high-byte index)
                              (low-byte index)))))
        cont)))))
;----------------------------------------------------------------
; IF and BEGIN
; (IF <test> <consequent> <alternate>).
; The test is compiled with a fall-through continuation and followed by a
; JUMP-IF-FALSE to ALT-LABEL.  Both arms are compiled with CONT itself.
; The alternate is read with CADDDR unconditionally, so the form must
; always carry one.
(define-compilator 'if syntax-type
  (lambda (node depth frame cont)
    (let ((exp (node-form node))
          (alt-label (make-label))
          (join-label (make-label)))
      (sequentially
       ;; Test
       (compile (cadr exp) depth frame (fall-through-cont node 1))
       (instruction-using-label (enum op jump-if-false) alt-label)
       ;; Consequent
       (compile (caddr exp) depth frame cont)
       ;; When CONT is not a return continuation the consequent would run
       ;; on into the alternate, so jump over it to JOIN-LABEL.
       (if (fall-through-cont? cont)
           (instruction-using-label (enum op jump) join-label)
           empty-segment)
       ;; Alternate
       (attach-label alt-label
                     (compile (cadddr exp) depth frame cont))
       (attach-label join-label
                     empty-segment)))))
; (BEGIN <exp> ...).  Every expression but the last is compiled with an
; ignore-values continuation; the last one receives CONT.  An empty BEGIN
; compiles to a trap.
(define-compilator 'begin syntax-type
  (lambda (node depth frame cont)
    (let ((forms (cdr (node-form node))))
      (cond ((null? forms)
             (generate-trap depth frame cont "null begin"))
            (else
             (let ((debug-node
                    (make-node operator/begin ;For debugging database
                               (cons 'begin forms))))
               (let walk ((remaining forms) (position 1))
                 (let ((current (car remaining))
                       (later (cdr remaining)))
                   (if (null? later)
                       (compile current depth frame cont)
                       (sequentially
                        (compile current
                                 depth
                                 frame
                                 (ignore-values-cont debug-node position))
                        (walk later (+ position 1))))))))))))
;----------------------------------------------------------------
; Calls
; Compile a procedure call, choosing a strategy from the operator:
;   - nodes already marked with a type error: generic call;
;   - a name: COMPILE-NAME-CALL;
;   - a LAMBDA without rest argument: COMPILE-REDEX;
;   - a literal primop: that primop's compilator (it is a compiler bug
;     for such a primop to have none);
;   - anything else: generic call.
(define (compile-call node depth frame cont)
  (cond ((node-ref node 'type-error)
         (compile-unknown-call node depth frame cont))
        (else
         (let ((proc-node (car (node-form node))))
           (cond ((name-node? proc-node)
                  (compile-name-call node proc-node depth frame cont))
                 ((and (lambda-node? proc-node)
                       (not (n-ary? (cadr (node-form proc-node)))))
                  (compile-redex proc-node
                                 (cdr (node-form node))
                                 depth
                                 frame
                                 cont))
                 ((and (literal-node? proc-node)
                       (primop? (node-form proc-node)))
                  (let* ((primop (node-form proc-node))
                         (compilator (primop-compilator primop)))
                    (if compilator
                        (compilator node depth frame cont)
                        (assertion-violation 'compile-call
                                             "compiler bug: primop has no compilator"
                                             primop
                                             (schemify node)))))
                 (else
                  (compile-unknown-call node depth frame cont)))))))
; Install COMPILE-CALL as the compilator for the internal CALL operator.
(define-compilator 'call 'internal compile-call)
; Compile a call whose operator is the name PROC-NODE.  If the name's
; binding has a static value that is a primop with a compilator, that
; compilator is used; if it is a transform, the inline expansion is
; compiled (unless the transform hands back the form unchanged).  Every
; other case is compiled as a generic call.
(define (compile-name-call node proc-node depth frame cont)
  (define (as-unknown-call)
    (compile-unknown-call node depth frame cont))
  (let ((binding (name-node-binding proc-node)))
    (if (not (binding? binding))
        (as-unknown-call)
        (let ((static (binding-static binding)))
          (cond ((primop? static)
                 (let ((compilator (primop-compilator static)))
                   (if compilator
                       (compilator node depth frame cont)
                       (as-unknown-call))))
                ((transform? static)
                 (let* ((form (node-form node))
                        (expansion (apply-inline-transform static
                                                           form
                                                           (node-form proc-node))))
                   (if (eq? expansion form)
                       (as-unknown-call)
                       (compile expansion depth frame cont))))
                (else
                 (as-unknown-call)))))))
; Compile a call to a computed procedure.
; Code order: the continuation push (if CONT is not a return), the argument
; pushes, the operator expression, the call instruction, and finally the
; return-point code.  The operator is compiled at the depth reached after
; all arguments have been pushed.
(define (compile-unknown-call node depth frame cont)
  (receive (before depth label after)
      (maybe-push-continuation depth frame cont node)
    (let* ((form (node-form node))
           (nargs (length (cdr form)))
           (call-depth (+ depth nargs)))
      (sequentially before
                    (push-arguments node depth frame)
                    (compile (car form)
                             call-depth
                             frame
                             (fall-through-cont node 0))
                    (call-instruction nargs call-depth label)
                    after))))
; A redex is a call of the form ((lambda (x1 ... xn) body ...) e1 ... en).
; The arguments are pushed on the stack and the body is compiled inline.
; A mismatch between the number of formals and arguments compiles to a
; trap; with no formals at all the body is compiled directly.
(define (compile-redex proc-node args depth frame cont)
  (let* ((lambda-form (node-form proc-node))
         (formals (cadr lambda-form))
         (body (caddr lambda-form))
         (nargs (length args)))
    (cond ((not (= (length formals) nargs))
           (generate-trap depth
                          frame
                          cont
                          "wrong number of arguments"
                          (cons (schemify proc-node)
                                (map schemify args))))
          ((null? formals)
           (compile body depth frame cont)) ;+++
          (else
           (let ((body-depth (+ depth nargs)))
             (set-frame-locations! formals body-depth)
             (sequentially
              (push-all-with-names args formals depth frame)
              (compile-inline-body nargs
                                   (map name-node->symbol formals)
                                   body
                                   body-depth
                                   frame
                                   cont)))))))
; Compile BODY at DEPTH, where the top NARGS stack slots hold the values of
; FORMALS.  The environment is recorded with NOTE-ENVIRONMENT at the depth
; below those slots.  Unless CONT is a return continuation, a POP-N
; instruction follows the body to remove the NARGS slots.
(define (compile-inline-body nargs formals body depth frame cont)
  (sequentially
   (note-environment formals
                     (- depth nargs)
                     (compile body depth frame cont))
   (cond ((return-cont? cont)
          empty-segment)
         (else
          (deliver-value (instruction (enum op pop-n)
                                      (high-byte nargs)
                                      (low-byte nargs))
                         cont)))))
;----------------------------------------------------------------
; (PURE-LETREC ((<var> <val>) ...) (<free var> ...) <body>)
; These are LETREC's where the values are all LAMBDA's.  They are produced by
; opt/flatten.scm.
;
; The code built by COMPILE-RECURSIVE-ENVIRONMENT is followed by a PUSH, and
; the body is then compiled inline one slot deeper, with that slot described
; to COMPILE-INLINE-BODY as a single entry listing the letrec-bound names
; followed by the free variables.
(define-compilator 'pure-letrec syntax-type
  (lambda (node depth frame cont)
    (let* ((exp (node-form node))
           (specs (cadr exp))
           (free-vars (caddr exp))
           (body (cadddr exp))
           ;; Remember the free variables' bindings so that they can be
           ;; put back once the environment code has been generated.
           (old-locations (map name-node-binding free-vars)))
      (receive (env-code ignore-free-vars-in-order)
          (compile-recursive-environment free-vars
                                         depth
                                         (template-offset frame depth)
                                         (letrec-template-maker specs frame))
        ;; Restore the bindings saved above (presumably changed while the
        ;; templates were compiled -- confirm against
        ;; COMPILE-RECURSIVE-ENVIRONMENT).
        (for-each (lambda (node location)
                    (node-set! node 'binding location))
                  free-vars
                  old-locations)
        (set-lexical-offsets! (map car specs) depth)
        (depth-check! frame (+ depth 1))
        (sequentially
         env-code
         (instruction (enum op push))
         (compile-inline-body 1
                              (list (map name-node->symbol
                                         (append (map car specs)
                                                 free-vars)))
                              body
                              (+ depth 1)
                              frame
                              cont))))))
; Returns a procedure of one argument, the free variables in order.
; After getting the free variable list (to pass to NOTE-ENVIRONMENT) this
; compiles the values in SPECS, all of which are lambdas.  It returns the
; template indexes of the resulting templates.
;
; Each lambda is compiled with the variables bound by SPECS followed by the
; free variables as its environment, and named after the variable it is
; bound to; the resulting template is entered in FRAME as a literal.
(define (letrec-template-maker specs frame)
  (lambda (free-vars-in-order)
    (let ((all-vars (append (map car specs)
                            free-vars-in-order)))
      (map (lambda (spec)
             (receive (proc-code proc-frame)
                 (compile-lambda (unflatten-form (cadr spec))
                                 all-vars
                                 (node-form (car spec))
                                 #f
                                 frame)
               (literal->index frame
                               (segment->template proc-code proc-frame))))
           specs))))
;----------------------------------------------------------------
; We don't pass the incremented depth to MAKE-RETURN-POINT because the
; return-pointer is not included in a continuation's size.
;
; Returns before-segment new-depth label after-segment.
;
; In all of these NODE is the expression whose value will be returned to the
; continuation. It is saved for debugging assistance.
; Like PUSH-CONTINUATION, except that for a return continuation nothing is
; pushed: the before and after segments are empty, DEPTH is unchanged and
; the label is #f.
(define (maybe-push-continuation depth frame cont node)
  (cond ((return-cont? cont)
         (values empty-segment depth #f empty-segment))
        (else
         (push-continuation depth frame cont node))))
; Push a continuation for the non-tail continuation CONT.  The return
; protocol accepts zero values and is flagged as ignoring values when CONT
; is an ignore-values continuation, and accepts one value otherwise.
; It is an error to call this with a return continuation.
(define (push-continuation depth frame cont node)
  (if (return-cont? cont)
      (assertion-violation 'push-continuation "making a return point in tail position" cont))
  (let* ((ignore? (ignore-values-cont? cont))
         (protocol (continuation-protocol (if ignore? 0 1)
                                          ignore?)))
    (really-push-continuation depth frame protocol node cont)))
; Push a continuation whose return point has no protocol of its own: the
; empty segment is passed where PUSH-CONTINUATION passes a protocol.
; Note that NODE comes before CONT in this argument list.
(define (push-continuation-no-protocol depth frame node cont)
  (really-push-continuation depth frame empty-segment node cont))
; Shared worker for the continuation pushers.  Returns four values:
;   1. the code run before the call (a PUSH-FALSE instruction),
;   2. the depth after that push (DEPTH + 1),
;   3. a fresh label for the return point,
;   4. the code placed after the call: the continuation data for DEPTH
;      followed by PROTOCOL attached to the label.
; When source code is being kept, PROTOCOL is first passed through
; NOTE-SOURCE-CODE together with the source description of NODE.
(define (really-push-continuation depth frame protocol node cont)
  (depth-check! frame (+ depth 1))
  (let ((label (make-label))
        (protocol (if (keep-source-code?)
                      (note-source-code (fixup-source node
                                                      (cont-source-info cont))
                                        protocol
                                        frame)
                      protocol)))
    (values (instruction (enum op push-false))
            (+ depth 1)
            label
            (sequentially (continuation-data #f depth (template-offset frame depth))
                          (attach-label label protocol)))))
; Build the source description recorded for a return point.  The result is
; #f without a NODE.  Otherwise it is a list headed by the schemified NODE;
; when DESTINATION is a pair (i . node) it continues with i and the
; schemified destination node.
(define (fixup-source node destination)
  ;; Abbreviate this somehow?
  (cond ((not node)
         #f)
        ((pair? destination)
         (cons (schemify node)
               (cons (car destination)
                     (schemify (cdr destination)))))
        (else
         (list (schemify node)))))
;----------------------------------------------------------------
; Pushing arguments.
;
; This is a mess because we try to merge push instructions with other common
; ones. There are three entry points:
; Push every argument of the call NODE.  Produces the empty segment when
; the call has no arguments.
(define (push-arguments node depth frame)
  (let ((args (cdr (node-form node))))
    (if (not (null? args))
        (really-push-arguments args depth frame node #t)
        empty-segment)))
; Push all of NODES except the last one, which is compiled but not pushed
; (PUSH-LAST? is #f).  NODES must not be empty: REALLY-PUSH-ARGUMENTS takes
; its CAR unconditionally.
(define (push-all-but-last nodes depth frame debug-info)
  (really-push-arguments nodes depth frame debug-info #f))
; Push all of NODES, passing the list NAMES as the debug info so that the
; argument continuations are named continuations (see COMPILE-ARGUMENT).
; NODES must not be empty: REALLY-PUSH-ARGUMENTS takes its CAR
; unconditionally.
(define (push-all-with-names nodes names depth frame)
  (really-push-arguments nodes depth frame names #t))
; Compile and push the single argument number INDEX (counting from zero) of
; the call NODE.  Element INDEX + 1 of the node's form is used because the
; operator occupies position zero.
(define (push-argument node index depth frame)
  (depth-check! frame (+ depth 1))
  (let ((position (+ index 1)))
    (receive (code pushed?)
        (compile-argument (list-ref (node-form node) position)
                          depth
                          frame
                          node
                          position
                          #f
                          #t)
      (cond (pushed? code)
            (else (sequentially code push-instruction))))))
; The main loop.
; Compiles NODES left to right; argument I (counting from one) is compiled
; at depth DEPTH + I - 1.  PRE-PUSH? records that the previous argument's
; value has not been pushed yet, so the push must come with (or before) the
; current argument's code.  The last argument is pushed only if PUSH-LAST?.
; NODES must not be empty.
(define (really-push-arguments nodes depth frame debug-info push-last?)
  (let recur ((args nodes) (i 1) (pre-push? #f))
    (let ((last? (null? (cdr args))))
      (receive (arg-code pushed?)
          (compile-argument (car args)
                            (+ depth (- i 1))
                            frame
                            debug-info
                            i
                            pre-push?
                            (if last? push-last? #t))
        (if last?
            (begin
              (depth-check! frame (+ depth (if push-last? i (- i 1))))
              (if (and push-last? (not pushed?))
                  (sequentially arg-code push-instruction)
                  arg-code))
            (sequentially arg-code
                          (recur (cdr args) (+ i 1) (not pushed?))))))))
; Pick the name node for argument number INDEX (counting from one) out of
; NAMES.  Falls back to the first name if NAMES is shorter than INDEX.
(define (argument-name-node names index)
  (let loop ((rest names) (i 1))
    (cond ((not (pair? rest)) (car names))
          ((= i index) (car rest))
          (else (loop (cdr rest) (+ i 1))))))

; Compile one argument, merging pushes into it where possible.
;   BEFORE? - a push of the previous value must precede this argument
;   AFTER?  - this argument's value is to be pushed afterwards
; Returns two values: the code, and whether that code already includes the
; push of this argument's own value.
;
; DEBUG-INFO is either a list of name nodes parallel to the arguments, in
; which case the argument is compiled with a continuation named after the
; INDEX'th name, or something else (the call node), in which case the
; continuation records that this is the INDEX'th subexpression of it.
(define (compile-argument node depth frame debug-info index before? after?)
  (cond ((and before?                   ;+++
              (maybe-compile-with-push node depth frame #t))
         => (lambda (code)
              (values code #f)))
        ((and after?                    ;+++
              (maybe-compile-with-push node depth frame #f))
         => (lambda (code)
              (values (pre-push code before?)
                      #t)))
        (else
         (values (pre-push (compile node
                                    depth
                                    frame
                                    (if (pair? debug-info)
                                        ;; Use this argument's own name, not
                                        ;; always the first one in the list.
                                        (named-cont
                                         (node-form
                                          (argument-name-node debug-info index)))
                                        (fall-through-cont debug-info index)))
                           before?)
                 #f))))
; Put a push instruction in front of CODE when DO-IT? is true; otherwise
; CODE is returned as it is.
(define (pre-push code do-it?)
  (cond (do-it? (sequentially push-instruction code))
        (else code)))
; The plain PUSH instruction, built once and shared by all users.
(define push-instruction
  (instruction (enum op push)))
;----------------------------------------------------------------
; We have two sizes of these because the big size is very rare and
; significantly slower (because the argument count cannot be encoded in
; the protocol).
;
; LABEL is the return point, or #f for a tail call.  Calls with more than
; MAXIMUM-STACK-ARGS arguments use BIG-CALL with a two-byte count; a tail
; BIG-CALL has two zero bytes where the label would go.
(define (call-instruction nargs depth label)
  (let ((big? (> nargs maximum-stack-args))) ;+++
    (cond ((and label big?)
           (instruction-using-label (enum op big-call)
                                    label
                                    (high-byte nargs)
                                    (low-byte nargs)))
          (label
           (instruction-using-label (enum op call)
                                    label
                                    nargs))
          (big?
           (instruction (enum op big-call)
                        0
                        0
                        (high-byte nargs)
                        (low-byte nargs)))
          (else
           (instruction (enum op tail-call)
                        nargs
                        (high-byte depth)
                        (low-byte depth))))))
; Read stack slot INDEX: the one-byte STACK-REF when INDEX is below
; BYTE-LIMIT, the two-byte BIG-STACK-REF otherwise.
(define (stack-ref-instruction index)
  (cond ((< index byte-limit)           ;+++
         (instruction (enum op stack-ref)
                      index))
        (else
         (instruction (enum op big-stack-ref)
                      (high-byte index)
                      (low-byte index)))))
; Write stack slot INDEX: the one-byte STACK-SET! when INDEX is below
; BYTE-LIMIT, the two-byte BIG-STACK-SET! otherwise.
(define (stack-set!-instruction index)
  (cond ((< index byte-limit)           ;+++
         (instruction (enum op stack-set!)
                      index))
        (else
         (instruction (enum op big-stack-set!)
                      (high-byte index)
                      (low-byte index)))))
; Read element INDEX of the object held in stack slot INDEX-IN-STACK.
; The compact STACK-INDIRECT form needs both operands below BYTE-LIMIT;
; if either is too large, BIG-STACK-INDIRECT with two-byte operands is
; emitted instead.
(define (stack-indirect-instruction index-in-stack index)
  (if (or (>= index byte-limit)         ;+++
          (>= index-in-stack byte-limit))
      (instruction (enum op big-stack-indirect)
                   (high-byte index-in-stack)
                   (low-byte index-in-stack)
                   (high-byte index)
                   (low-byte index))
      (instruction (enum op stack-indirect)
                   index-in-stack
                   index)))
;----------------------------------------------------------------
; Compile-time continuations
;
; A compile-time continuation is a pair (kind . source-info).
; Kind is one of the following:
; 'return - invoke the current full continuation.
; 'fall-through - fall through to subsequent instructions.
; 'ignore-values - ignore values, then fall through.
; 'accept-values - pass values to continuation
; Source-info is one of:
; #f - we don't know anything
; symbol - value delivered to subsequent instructions will be assigned to
; a variable with this name. If the value being assigned is a lambda, we
; can give that lambda that name.
; (i . node) - the value being computed is the i'th subexpression of the node.
; Representation: a continuation is the pair (KIND . SOURCE-INFO), so the
; accessors are simply CAR and CDR.
(define (make-cont kind source-info) (cons kind source-info))
(define cont-kind car)
(define cont-source-info cdr)
; We could probably optimize jumps to jumps.
;(define (make-jump-cont label cont)
; (if (fall-through-cont? cont)
; (make-cont label (cont-name cont))
; cont))
; Return continuations: the value is returned to the current full
; continuation.  NAME is stored as the source info.
(define (return-cont name)
  (make-cont 'return name))
(define (return-cont? cont)
  (eq? (cont-kind cont) 'return))
; Fall through into next instruction while compiling the I'th part of NODE.
(define (fall-through-cont node i)
  (make-cont 'fall-through (cons i node)))
; A fall-through continuation with no source info.
(define (plain-fall-through-cont)
  (make-cont 'fall-through #f))
; Note that this is true of every continuation that is not a return
; continuation, including the ignore-values and accept-values kinds.
(define (fall-through-cont? cont)
  (not (return-cont? cont)))
; Ignore return value, then fall through
; A one-instruction segment holding IGNORE-VALUES-PROTOCOL.
(define ignore-values-segment
  (instruction ignore-values-protocol))
; Continuation for the I'th part of NODE whose values are discarded.
(define (ignore-values-cont node i)
  (make-cont 'ignore-values (cons i node)))
(define (ignore-values-cont? cont)
  (eq? (cont-kind cont) 'ignore-values))
; Continuation for the I'th part of NODE that has its values passed on to
; the continuation.
(define (accept-values-cont node i)
  (make-cont 'accept-values (cons i node)))
(define (accept-values-cont? cont)
  (eq? (cont-kind cont) 'accept-values))
; Value is in *val*; deliver it to its continuation.
; For a return continuation SEGMENT is followed by a RETURN instruction;
; for every other kind SEGMENT is returned unchanged.
(define (deliver-value segment cont)
  (cond ((return-cont? cont)
         (sequentially segment
                       (instruction (enum op return))))
        (else
         segment)))                     ; just fall through to next instruction
; For putting names to lambda expressions:
; a fall-through continuation whose source info is NAME itself rather than
; an (i . node) pair.
(define (named-cont name)
  (make-cont 'fall-through name))
; The name carried by CONT: its source info, unless that is an (i . node)
; pair, in which case there is no name and #f is returned.
(define (cont-name cont)
  (let ((info (cont-source-info cont)))
    (and (not (pair? info))
         info)))
;----------------------------------------------------------------
; Utilities
; Find lookup result that was cached by classifier
; The binding property is either a location, a 1- or 2-element list with
; stack index and template index, or 'unbound
; A node with no BINDING property yields its form instead.
(define (name-node-binding node)
  (let ((cached (node-ref node 'binding)))
    (if cached
        cached
        (node-form node))))
; Produce something for source code that contains a compile-time error.
; STUFF is reported at compile time through WARNING.  The generated code
; loads the literal (error . STUFF) from the template and then executes a
; TRAP instruction, delivered to CONT.
(define (generate-trap depth frame cont . stuff)
  (apply warning 'generate-trap stuff)
  (let ((load-error-data
         (stack-indirect-instruction (template-offset frame depth)
                                     (literal->index frame (cons 'error stuff))))
        (trap-code
         (deliver-value (instruction (enum op trap))
                        cont)))
    (sequentially load-error-data trap-code)))
;----------------------------------------------------------------
; Type checking.  This gets called on all nodes.
; Returns the node to compile.  Only forms that are pairs with a node in
; operator position are examined, and only while *TYPE-CHECK?* is true:
;   - operator of a restrictive procedure type: the call is rebuilt with
;     MAKE-SIMILAR-NODE and, if the argument types do not meet the
;     procedure's domain, diagnosed with DIAGNOSE-CALL-ERROR;
;   - operator that cannot be a procedure: a warning is issued and NODE is
;     marked with a TYPE-ERROR property;
;   - everything else: NODE is returned untouched.
(define (type-check node)
  (define (check-restrictive-call proc-node proc-type args)
    (let* ((args-type (make-some-values-type
                       (map (lambda (arg)
                              (meet-type (node-type arg)
                                         value-type))
                            args)))
           (checked (make-similar-node node
                                       (cons proc-node
                                             args))))
      (if (not (meet? args-type
                      (procedure-type-domain proc-type)))
          (diagnose-call-error checked proc-type))
      checked))
  (define (flag-non-procedure proc-type)
    ;; Could also check args for one-valuedness.
    (let ((message "non-procedure in operator position"))
      (warning 'type-check
               message
               (schemify node)
               `(procedure: ,proc-type))
      (node-set! node 'type-error message))
    node)
  (define (check-operator proc-node args)
    (let ((proc-type (node-type proc-node)))
      (cond ((procedure-type? proc-type)
             (if (restrictive? proc-type)
                 (check-restrictive-call proc-node proc-type args)
                 node))
            ((meet? proc-type any-procedure-type)
             node)
            (else
             (flag-non-procedure proc-type)))))
  (if (not *type-check?*)
      node
      (let ((form (node-form node)))
        (if (and (pair? form)
                 (node? (car form)))
            (check-operator (car form) (cdr form))
            node))))
; Turn the checks made by TYPE-CHECK on (CHECK? true) or off (CHECK? false).
(define (set-type-check?! check?)
  (set! *type-check?* check?))
; The flag consulted by TYPE-CHECK; checking is on initially.
(define *type-check?* #t)
; Report a call whose arguments do not fit PROC-TYPE.  The message depends
; on whether the procedure type has a fixed arity and, if it does, whether
; the number of arguments matches it.  A warning showing what the procedure
; wants and what the arguments are is issued, and the message is stored as
; the node's TYPE-ERROR property.
(define (diagnose-call-error node proc-type)
  (let* ((args (cdr (node-form node)))
         (message
          (if (fixed-arity-procedure-type? proc-type)
              (if (= (procedure-type-arity proc-type)
                     (length args))
                  "argument type error"
                  "wrong number of arguments")
              "invalid arguments")))
    (warning 'diagnose-call-error
             message
             (schemify node)
             `(procedure wants:
                         ,(rail-type->sexp (procedure-type-domain proc-type)
                                           #f))
             `(arguments are: ,(map (lambda (arg)
                                      (type->sexp (node-type arg) #t))
                                    args)))
    (node-set! node 'type-error message)))
; Type system loophole
; Only the third element of the form (the expression) is compiled; the
; second element is not looked at here.
(define-compilator 'loophole syntax-type
  (lambda (node depth frame cont)
    (compile (caddr (node-form node)) depth frame cont)))
|