Source file db.ml

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220

open Printf

module Ht = Hashtbl

type filename = string

type position = { off: int;
                  len: int }

type db = { data_fn: filename;
            index_fn: filename;
            data: Unix.file_descr;
            index: (string, position) Ht.t }

module Internal = struct

  let create fn =
    let data_fn = fn in
    let index_fn = fn ^ ".idx" in
    let data =
      Unix.(openfile data_fn [O_RDWR; O_CREAT; O_EXCL] 0o600) in
    (* we just check there is not already an index file *)
    let index_file =
      Unix.(openfile index_fn [O_RDWR; O_CREAT; O_EXCL] 0o600) in
    Unix.close index_file;
    let index = Ht.create 11 in
    { data_fn; index_fn; data; index }

  let open_rw fn =
    let data_fn = fn in
    let index_fn = fn ^ ".idx" in
    let data =
      Unix.(openfile data_fn [O_RDWR] 0o600) in
    let index = Utls.restore index_fn in
    { data_fn; index_fn; data; index }

  let open_ro fn =
    let data_fn = fn in
    let index_fn = fn ^ ".idx" in
    let data =
      Unix.(openfile data_fn [O_RDONLY] 0o600) in
    let index = Utls.restore index_fn in
    { data_fn; index_fn; data; index }

  let dummy () =
    { data_fn = "/dev/null";
      index_fn = "/dev/null.idx";
      data = Unix.(openfile "/dev/null" [O_RDWR] 0o600);
      index = Ht.create 0 }

  let close_simple db =
    Unix.close db.data

  let close_sync_index db =
    Unix.close db.data;
    Utls.save db.index_fn db.index

  let sync db =
    ExtUnix.All.fsync db.data;
    Utls.save db.index_fn db.index

  let destroy db =
    Ht.reset db.index;
    Unix.close db.data;
    Sys.remove db.data_fn;
    Sys.remove db.index_fn

  let mem db k =
    Ht.mem db.index k

  let add db k str =
    (* go to end of data file *)
    let off = Unix.(lseek db.data 0 SEEK_END) in
    let len = String.length str in
    let written = Unix.write_substring db.data str 0 len in
    begin
      if written <> len then
        let err_msg =
          sprintf
            "Db.Internal.add: db: %s k: %s str: %s written: %d len: %d"
            db.data_fn k str written len in
        failwith err_msg
    end;
    Ht.add db.index k { off; len }

  let replace db k str =
    (* go to end of data file *)
    let off = Unix.(lseek db.data 0 SEEK_END) in
    let len = String.length str in
    let written = Unix.write_substring db.data str 0 len in
    begin
      if written <> len then
        let err_msg =
          sprintf
            "Db.Internal.replace: db: %s k: %s str: %s written: %d len: %d"
            db.data_fn k str written len in
        failwith err_msg
    end;
    Ht.replace db.index k { off; len }

  let remove db k =
    (* we just remove it from the index, not from the data file *)
    Ht.remove db.index k

  let raw_read db pos =
    let off = pos.off in
    let len = pos.len in
    let buff = Bytes.create len in
    let off' = Unix.(lseek db.data off SEEK_SET) in
    begin
      if off' <> off then
        let err_msg =
          sprintf "Db.Internal.raw_read: db: %s off: %d len: %d off': %d"
            db.data_fn off len off' in
        failwith err_msg
    end;
    let read = Unix.read db.data buff 0 len in
    begin
      if read <> len then
        let err_msg =
          sprintf "Db.Internal.raw_read: db: %s off: %d len: %d read: %d"
            db.data_fn off len read in
        failwith err_msg
    end;
    Bytes.unsafe_to_string buff

  let find db k =
    let v_addr = Ht.find db.index k in
    raw_read db v_addr

  let iter f db =
    Ht.iter (fun k v ->
        f k (raw_read db v)
      ) db.index

  let fold f db init =
    Ht.fold (fun k v acc ->
        f k (raw_read db v) acc
      ) db.index init

end

module RO = struct

  type t = db

  let open_existing fn =
    Internal.open_ro fn

  let dummy () =
    Internal.dummy ()

  let close db =
    Internal.close_simple db

  let mem db k =
    Internal.mem db k

  let find db k =
    Internal.find db k

  let raw_read db pos =
    Internal.raw_read db pos

  let iter f db =
    Internal.iter f db

  let fold f db init =
    Internal.fold f db init

end

module RW = struct

  type t = db

  let create fn =
    Internal.create fn

  let open_existing fn =
    Internal.open_rw fn

  let dummy () =
    Internal.dummy ()

  let close db =
    Internal.close_sync_index db

  let sync db =
    Internal.sync db

  let destroy db =
    Internal.destroy db

  let mem db k =
    Internal.mem db k

  let add db k str =
    Internal.add db k str

  let replace db k str =
    Internal.replace db k str

  let remove db k =
    Internal.remove db k

  let find db k =
    Internal.find db k

  let raw_read db pos =
    Internal.raw_read db pos

  let iter f db =
    Internal.iter f db

  let fold f db init =
    Internal.fold f db init

end