(* winnowing.mli: interface for a bounded window queue and the winnow function *)
(* Signature of a bounded FIFO queue that, besides its contents, keeps track
 * of two numbers:
 *   - its current size (how many elements it holds right now), and
 *   - the total number of times enqueue has been called on it.
 * Updating operations ([enqueue], [dequeue]) return the resulting queue
 * as a value instead of returning unit. *)
module type BoundedQueueWithCounter = sig
(* the abstract type of bounded queues holding elements of one type *)
type 'a t
(* [empty n] returns an empty queue with capacity n
 * NOTE(review): behaviour for n <= 0 is not specified in this interface *)
val empty : int -> 'a t
(* [create n i] returns a full queue with capacity n,
 * with every element initialized to i
 * NOTE(review): whether these n initial elements are included in [count]
 * is not stated here - confirm against the implementation *)
val create : int -> 'a -> 'a t
(* [is_empty q] returns true if q holds no elements, false otherwise *)
val is_empty : 'a t -> bool
(* [is_full q] returns true if q is full, false otherwise *)
val is_full : 'a t -> bool
(* [size q] returns the number of elements currently in q *)
val size : 'a t -> int
(* [enqueue v q] returns a queue that has the contents of q with the
 * value v enqueued at the tail.
 * If q is full, the first element (head) is dequeued before v is
 * enqueued, so the capacity is never exceeded. *)
val enqueue : 'a -> 'a t -> 'a t
(* [dequeue q] removes the first element (head) of q and returns a tuple
 * of the removed element and the updated queue.
 * The removed element is wrapped in an option.
 * If q is empty then the first value of the tuple is None.
 * NOTE(review): the queue returned in the empty case is presumably q
 * itself - confirm against the implementation *)
val dequeue : 'a t -> 'a option * 'a t
(* [count q] returns the number of elements that have been enqueued
 * (including ones that are no longer in the queue) *)
val count : 'a t -> int
(* [fold f init q] folds [f] over the elements of [q] in order from
 * the head to the tail, starting with the initial value [init] *)
val fold : ('b -> 'a -> 'b) -> 'b -> 'a t -> 'b
(* [to_list q] returns a list of the elements of q in queue order:
 * the first element of the list is the head of q and the last element
 * is the tail of q *)
val to_list: 'a t -> 'a list
end
(* An implementation of BoundedQueueWithCounter using a record type, with
 * two lists to store the data. The first list stores the front of the queue,
 * the second list stores the back of the queue in reverse order.
 * The module is sealed with BoundedQueueWithCounter, so this representation
 * is not visible to clients; they only see the abstract queue type.
 *
 * AF: the elements of the queue are stored in the [data] field, the current
 * size is stored in [size], the maximum size is stored in [maxsize], and the
 * number of times an element has been enqueued is stored in [count].
 *
 * RI:
 *   - [size] <= [maxsize]
 *   - [size], [maxsize] and [count] cannot be negative
 *   - [size] is the sum of the lengths of both lists in [data]
 *   - the head of the first list in [data] is the head of the queue
 *   - the head of the second list in [data] is the tail of the queue
 *)
module Window : BoundedQueueWithCounter
(* [winnow w h] applies the winnowing algorithm to the list of hashes [h]
 * using window size [w].
 * returns: a list of (v,p) tuples where v is a hash value and p is the
 * position in the original input. The (v,p) list is not guaranteed to be
 * in any particular order.
 * requires: [w] is a positive integer
 * NOTE(review): p is presumably the index of v within [h]; whether it is
 * 0-based or 1-based is not stated here - confirm against the implementation
 *)
val winnow: int -> int list -> (int * int) list