File: hashTable.c

package info (click to toggle)
python-deeptoolsintervals 0.1.9-3
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, bullseye, forky, sid, trixie
  • size: 304 kB
  • sloc: ansic: 2,317; python: 596; sh: 12; makefile: 5
file content (160 lines) | stat: -rw-r--r-- 3,942 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <assert.h>
#include "murmur3.h"
#include "gtf.h"

uint64_t hashString(char *s) {
    int len = strlen(s);
    uint64_t hash_val[2];
    uint32_t seed = 0xAAAAAAAA;
#if UINTPTR_MAX == 0xffffffff
    MurmurHash3_x86_128((void *) s, len, seed, (void *) &hash_val);
#else
    MurmurHash3_x64_128((void *) s, len, seed, (void *) &hash_val);
#endif
    return hash_val[0];
}

hashTable *initHT(uint64_t size) {
    hashTable *ht = calloc(1, sizeof(hashTable));
    assert(ht);

    ht->elements = calloc(size, sizeof(hashTableElement*));
    assert(ht->elements);
    ht->str = calloc(size, sizeof(char*));
    assert(ht->str);

    ht->m = size;
    return ht;
}

void insertHTelement(hashTable *ht, hashTableElement *e, uint64_t hash) {
    uint64_t i = hash%ht->m;
    hashTableElement *curr = ht->elements[i];
    if(!curr) ht->elements[i] = e;
    else {
        while(curr->next) curr = curr->next;
        curr->next = e;
    }
}

static void rehashElement(hashTable *ht, hashTableElement *e) {
    hashTableElement *next = e->next;
    if(!e) return;
    uint64_t hash = hashString(ht->str[e->val]);
    e->next = NULL;
    insertHTelement(ht, e, hash);
    if(next) rehashElement(ht, next);
}

static void rehashHT(hashTable *ht) {
    int32_t i;
    hashTableElement *e;
    for(i=0; i<ht->l; i++) {
        if(ht->elements[i]) {
            e = ht->elements[i];
            ht->elements[i] = NULL;
            rehashElement(ht, e);
        }
    }
}

static void growHT(hashTable *ht) {
    int i;
    ht->m = ht->l+1;
    kroundup32(ht->m);
    ht->str = realloc(ht->str, ht->m*sizeof(char*));
    assert(ht->str);
    ht->elements = realloc(ht->elements, ht->m*sizeof(hashTableElement*));

    for(i=ht->l; i<ht->m; i++) {
        ht->str[i] = NULL;
        ht->elements[i] = NULL;
    }
    rehashHT(ht);
}

//don't do this if the element's already in the table!
int32_t addHTelement(hashTable *ht, char *s) {
    if(!s) return -1;
    uint64_t hash = hashString(s);
    int32_t val = ht->l++;
    if(ht->l >= ht->m) growHT(ht);
    ht->str[val] = strdup(s);

    hashTableElement *e = calloc(1, sizeof(hashTableElement));
    assert(e);
    e->val = val;
    insertHTelement(ht, e, hash);
    return val;
}

void destroyHTelement(hashTableElement *e) {
    hashTableElement *next = e->next;
    free(e);
    if(next) destroyHTelement(next);
}

void destroyHT(hashTable *ht) {
    int i;

    for(i=0; i<ht->l; i++) free(ht->str[i]);

    for(i=0; i<ht->m; i++) {
        if(ht->elements[i]) destroyHTelement(ht->elements[i]);
    }
    free(ht->elements);
    free(ht->str);
    free(ht);
}

int strExistsHT(hashTable *ht, char *s) {
    if(!s) return 0;
    uint64_t h = hashString(s);
    hashTableElement *curr = ht->elements[h%ht->m];
    while(curr) {
        if(strcmp(ht->str[curr->val], s) == 0) return 1;
        curr = curr->next;
    }
    return 0;
}

//Returns -1 if not present
int32_t str2valHT(hashTable *ht, char *s) {
    if(!s) return -1;
    uint64_t h = hashString(s);
    hashTableElement *curr = ht->elements[h%ht->m];
    while(curr) {
        if(strcmp(ht->str[curr->val], s) == 0) return curr->val;
        curr = curr->next;
    }
    return -1;
}

//Returns NULL on error
char *val2strHT(hashTable *ht, int32_t val) {
    if(val<0) return NULL;
    if(val>=ht->l) return NULL;
    return ht->str[val];
}

int hasAttribute(GTFtree *t, GTFentry *e, char *str) {
    int32_t i, key = str2valHT(t->htAttributes, str);

    for(i=0; i<e->nAttributes; i++) {
        if(e->attrib[i]->key == key) return 1;
    }
    return 0;
}

//Returns NULL if the entry lacks the attribute
char *getAttribute(GTFtree *t, GTFentry *e, char *str) {
    int32_t i, key = str2valHT(t->htAttributes, str);

    for(i=0; i<e->nAttributes; i++) {
        if(e->attrib[i]->key == key) return val2strHT(t->htAttributes, e->attrib[i]->val);
    }
    return NULL;
}