File: tuning.lisp

package info (click to toggle)
acl2 8.6%2Bdfsg-2
  • links: PTS
  • area: main
  • in suites: trixie
  • size: 1,111,420 kB
  • sloc: lisp: 17,818,294; java: 125,359; python: 28,122; javascript: 23,458; cpp: 18,851; ansic: 11,569; perl: 7,678; xml: 5,591; sh: 3,976; makefile: 3,833; ruby: 2,633; yacc: 1,126; ml: 763; awk: 295; csh: 233; lex: 197; php: 178; tcl: 49; asm: 23; haskell: 17
file content (42 lines) | stat: -rw-r--r-- 1,510 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
(in-package 3bz)

;;; some tuning parameters, and functions used in #+#.(...) to control
;;; features used by code

;;; deflate code tries to read/write/copy 64 bits at a time, and uses a
;;; ub64 buffer for bits when doing non-octet-aligned reads, but
;;; that's slow if ub64 is a bignum, so this is used to switch to ub32
;;; where possible
(defun use-ub64 ()
  "Return a feature expression, intended for use as #+#.(use-ub64),
that selects the 64-bit code paths.

The result is (:AND), which is always true as a feature expression,
on implementations listed below, and (:OR), which is always false,
everywhere else."
  ;; on mezzano, ub64 is better on some files, worse on others, so it
  ;; is deliberately not listed here for now
  #+ (or (and 64-bit sbcl)) '(:and)
  #- (or (and 64-bit sbcl)) '(:or))

;;; similarly, adler32 checksum accumulates as many bytes as possible
;;; before doing mod, so we can either use :ub64, :ub32 or :fixnum
;;; versions of adler32 code depending on which is fastest
(defun use-adler32 (version)
  "Return a feature expression saying whether the adler32 variant
named by VERSION should be used on this implementation.

VERSION is compared with EQL against the variant chosen for the
current implementation (one of :UB64, :UB32 or :FIXNUM).  Returns
(:AND), which is always true as a feature expression, when they match
and (:OR), which is always false, otherwise."
  (let ((preferred
          ;; ub64 is fastest on sbcl/x86-64, and seems better on
          ;; mezzano too now
          #+ (or mezzano (and sbcl x86-64)) :ub64
          #+ abcl :ub32
          ;; for now, just using fixnum elsewhere until there are
          ;; proper benchmarks. not sure if ub32 is faster than
          ;; fixnum anywhere, or if fixnum is good enough
          #- (or mezzano abcl (and sbcl x86-64)) :fixnum))
    (if (eql version preferred)
        '(:and)
        '(:or))))
;;; adler32 checksum is unrolled a bit to reduce loop overhead, this
;;; specifies how many iterations to unroll
;; todo: set this for more combinations of cpu/implementation once
;; there are benchmarks
(defconstant +adler32-unroll+
  #+sbcl 32
  #+mezzano 16
  #- (or mezzano sbcl) 8
  "Number of iterations by which the adler32 checksum loop is unrolled.
Chosen per implementation; 8 is the fallback where nothing more
specific has been picked.")