File: tuning.lisp

package info (click to toggle)
acl2 8.5dfsg-5
  • links: PTS
  • area: main
  • in suites: bookworm
  • size: 991,452 kB
  • sloc: lisp: 15,567,759; javascript: 22,820; cpp: 13,929; ansic: 12,092; perl: 7,150; java: 4,405; xml: 3,884; makefile: 3,507; sh: 3,187; ruby: 2,633; ml: 763; python: 746; yacc: 723; awk: 295; csh: 186; php: 171; lex: 154; tcl: 49; asm: 23; haskell: 17
file content (42 lines) | stat: -rw-r--r-- 1,510 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
(in-package 3bz)

;;; some tuning parameters, and functions used in #+#.(...) to control
;;; features used by code

;;; deflate code tries to read/write/copy 64 bits at a time, and uses a
;;; ub64 buffer for bits when doing non-octet-aligned reads, but
;;; that's slow if ub64 is a bignum, so this is used to switch to ub32
;;; where possible
(defun use-ub64 ()
  "Return a feature expression saying whether the ub64 code paths are enabled.

The result is the list (:AND), which is always true as a feature
expression, on 64-bit SBCL, and the list (:OR), which is always false,
on every other implementation."
  ;; Only 64-bit SBCL is switched on.  On mezzano, ub64 is better on
  ;; some files and worse on others, so it is left off for now.
  #+(and 64-bit sbcl) '(:and)
  #-(and 64-bit sbcl) '(:or))

;;; similarly, adler32 checksum accumulates as many bytes as possible
;;; before doing mod, so we can either use :ub64, :ub32 or :fixnum
;;; versions of adler32 code depending on which is fastest
(defun use-adler32 (version)
  "Return a feature expression saying whether adler32 variant VERSION is selected.

VERSION is compared with EQL against the single variant chosen for the
current implementation (:UB64, :UB32 or :FIXNUM).  The result is the
list (:AND), an always-true feature expression, when VERSION is that
variant, and the list (:OR), an always-false one, otherwise."
  (let ((preferred
          ;; ub64 is fastest on 64bit sbcl, and seems better on
          ;; mezzano too now
          #+(or mezzano (and sbcl x86-64)) :ub64
          ;; abcl gets the ub32 variant
          #+abcl :ub32
          ;; everywhere else just use fixnum until there are proper
          ;; benchmarks; not sure if ub32 is faster than fixnum
          ;; anywhere, or if fixnum is good enough
          #-(or mezzano abcl (and sbcl x86-64)) :fixnum))
    (if (eql version preferred)
        '(:and)
        '(:or))))
;;; The adler32 checksum loop is unrolled a bit to reduce loop
;;; overhead; this constant specifies how many iterations to unroll.
;; todo: set this for more combinations of cpu/implementation once
;; there are benchmarks
(defconstant +adler32-unroll+
  #+sbcl 32
  #+mezzano 16
  #-(or mezzano sbcl) 8
  "Number of iterations by which the adler32 checksum loop is unrolled.")