File: encode.go

package info (click to toggle)
pk4 5
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, bullseye, buster
  • size: 1,016 kB
  • sloc: sh: 146; makefile: 7
file content (115 lines) | stat: -rw-r--r-- 2,848 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
package index

import (
	"encoding/binary"
	"fmt"
	"io"
	"sort"
)

// countingWriter forwards writes to an underlying io.Writer while keeping a
// running total of the bytes that were accepted by it.
type countingWriter struct {
	// offset is the number of bytes written through this writer so far. It is
	// a uint32 and therefore wraps around once the total exceeds 1<<32 - 1.
	offset uint32
	// w is the destination that actually receives the data.
	w io.Writer
}

// Write passes p on to the wrapped writer and advances offset by however many
// bytes the wrapped writer reports as written, even when it also reports an
// error. The wrapped writer's results are returned unchanged.
func (cw *countingWriter) Write(p []byte) (int, error) {
	written, err := cw.w.Write(p)
	cw.offset += uint32(written)
	return written, err
}

// encode serializes idx to w as an index file laid out for seek+read lookups.
//
// The output consists of four consecutive sections. Offsets are counted from
// the first byte encode writes to w and are written as little-endian uint32:
//
//  1. Values: every distinct value of idx, in sorted order, each followed by
//     a newline.
//  2. Same-length blocks: for each key length in ascending order, the sorted
//     keys of that length, each immediately followed by the offset of its
//     value within section 1.
//  3. Block index: one BlockLocation{offset, length in bytes} per block, in
//     ascending key-length order. Key lengths between 1 and the longest key
//     that have no keys get an empty (zero-length) block, so the entries are
//     contiguous.
//  4. Trailer: the offset at which the block index starts.
//
// An empty or nil idx produces only the trailer (a zero offset). The first
// error reported by w is returned as-is.
func encode(w io.Writer, idx map[string]string) error {
	// Route every write through a counter so that the current file offset is
	// always known.
	cw := countingWriter{w: w}
	w = io.Writer(&cw)

	vals := make([]string, 0, len(idx))
	for _, val := range idx {
		vals = append(vals, val)
	}
	sort.Strings(vals) // for a deterministic index file
	valOffsets := make(map[string]uint32, len(vals))
	for _, val := range vals {
		// Several keys may share one value; store it only once.
		if _, written := valOffsets[val]; written {
			continue
		}
		valOffsets[val] = cw.offset
		if _, err := fmt.Fprintln(w, val); err != nil {
			return err
		}
	}

	byLength := make(map[int][]string)
	var highest int
	for key := range idx {
		l := len(key)
		byLength[l] = append(byLength[l], key)
		if l > highest {
			highest = l
		}
	}
	// Fill in the gaps so that lookups can seek+read instead of having to
	// binary search through same-length-blocks.
	for i := 1; i <= highest; i++ {
		if _, ok := byLength[i]; ok {
			continue
		}
		byLength[i] = []string(nil)
	}
	lengths := make([]int, 0, len(byLength))
	for l := range byLength {
		lengths = append(lengths, l)
	}
	sort.Ints(lengths) // for a deterministic index file

	// One extra slot for the end-of-blocks sentinel added below.
	sameLenOffsets := make(map[int]uint32, len(byLength)+1)
	// Write same-length-block:
	// <key><offset>
	// <key><offset>
	// …
	// Where each <key> has the same length.
	for _, l := range lengths {
		sameLenOffsets[l] = cw.offset
		keys := byLength[l]
		sort.Strings(keys)
		for _, k := range keys {
			if _, err := w.Write([]byte(k)); err != nil {
				return err
			}
			if err := binary.Write(w, binary.LittleEndian, valOffsets[idx[k]]); err != nil {
				return err
			}
		}
	}

	blockIndexOffset := cw.offset
	// Write block index (position == key length):
	// uint32(<same-len-block-offset>), uint32(<same-len-block-len>)

	// So that the length of the current block can be computed by looking at the
	// offset of the next block, record where the last block ends. With an
	// empty idx there are no blocks at all, so there is nothing to record (and
	// indexing lengths would panic).
	if len(lengths) > 0 {
		sameLenOffsets[lengths[len(lengths)-1]+1] = cw.offset
	}
	for _, l := range lengths {
		blockLen := sameLenOffsets[l+1] - sameLenOffsets[l]
		blockOffset := sameLenOffsets[l]
		if err := binary.Write(w, binary.LittleEndian, BlockLocation{blockOffset, blockLen}); err != nil {
			return err
		}
	}

	return binary.Write(w, binary.LittleEndian, blockIndexOffset)
}

// Encode writes the index to w using encode. Each entry is stored under the
// key "<Package>\t<Version>" of its source and maps to the value
// "<URL>\t<Size>" of its descriptor.
func (index URIs) Encode(w io.Writer) error {
	encoded := make(map[string]string, len(index))
	for source, descriptor := range index {
		key := fmt.Sprintf("%s\t%s", source.Package, source.Version)
		value := fmt.Sprintf("%s\t%d", descriptor.URL, descriptor.Size)
		encoded[key] = value
	}
	return encode(w, encoded)
}

// Encode writes the index to w using encode. Keys are stored as they appear in
// the index; each one maps to the value "<Package>\t<Version>" of its entry,
// where the version is rendered through its String method.
func (index Index) Encode(w io.Writer) error {
	encoded := make(map[string]string, len(index))
	for lookupKey, source := range index {
		version := source.Version.String()
		encoded[lookupKey] = fmt.Sprintf("%s\t%s", source.Package, version)
	}
	return encode(w, encoded)
}