-
Notifications
You must be signed in to change notification settings - Fork 430
/
30-vector.exs
213 lines (184 loc) · 6.04 KB
/
30-vector.exs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
# persistent bit-partitioned vector trie
# http://hypirion.com/musings/understanding-persistent-vector-pt-1 (and part 2)
defmodule Vector do
  @moduledoc """
  A persistent, bit-partitioned vector trie built from nested lists.

  Every node holds up to `@width` children. Elements live in the leaves and
  are located by splitting the index into `@bits`-wide digits, most
  significant digit first. A vector is the record
  `{Vector, size, depth, tree}`.
  """

  import Bitwise

  @bits 2
  @width 1 <<< @bits # 4-way branching
  @mask @width - 1

  require Record
  Record.defrecordp(:vec, Vector, size: 0, depth: 0, tree: [])

  @type t :: {Vector, non_neg_integer(), non_neg_integer(), list()}

  @doc """
  Builds a new empty vector.

      iex> Vector.new
      {Vector, 0, 0, []}
  """
  @spec new() :: t
  def new do
    vec()
  end

  @doc """
  Builds a new vector from the given list.

  The list is chunked into leaves of `@width` elements; a partial last chunk
  is padded with `nil`.

      iex> Vector.new(["tim", "jen"])
      {Vector, 2, 1, ["tim", "jen"]}
  """
  @spec new(list()) :: t
  def new(list) do
    # length/1 is O(n) on lists, so walk the input only once.
    count = length(list)
    depth = depth_for(count)
    vec(size: count, depth: depth, tree: tree_from_list(list, depth))
  end

  @doc """
  Get the size of the vector.

      iex> v = Vector.new([1, 2, 3])
      iex> Vector.size(v)
      3
  """
  @spec size(t) :: non_neg_integer()
  def size(vec(size: size)) do
    size
  end

  @doc """
  Gets the value from the vector at the given index.

  Returns `nil` when `index` is negative or not smaller than the size of the
  vector.

      iex> v = Vector.new(["tim", "jen", "mac", "kai"])
      iex> Vector.get(v, 2)
      "mac"
      iex> Vector.get(v, 4)
      nil
  """
  @spec get(t, integer()) :: any()
  def get(vec(size: size, depth: depth, tree: tree), index)
      when is_integer(index) and index >= 0 and index < size do
    do_get(tree, key(index, depth))
  end

  # Out-of-range indices would otherwise be wrapped by the bit mask and
  # silently return an unrelated element.
  def get(vec(size: _), index) when is_integer(index), do: nil

  @doc """
  Puts the value in a vector at the given index.

  `index` may address an existing element or be equal to the current size,
  in which case the value is appended. Returns the updated vector.

  Raises `RuntimeError` ("index too large") when `index` is greater than the
  size and `ArgumentError` when `index` is negative.

      iex> v = Vector.new
      iex> v = Vector.put(v, 0, "tim")
      iex> Vector.get(v, 0)
      "tim"
  """
  @spec put(t, non_neg_integer(), any()) :: t
  def put(vec(size: size, depth: depth, tree: tree), index, value) do
    if index > size, do: raise("index too large")
    if index < 0, do: raise(ArgumentError, "index must not be negative")

    new_size = max(size, index + 1)
    # Bindings made inside an `if` body do not escape it, so the grown
    # depth/tree are returned from a helper instead of being rebound in place.
    {depth, tree} = grow(depth, tree, new_size)
    vec(size: new_size, depth: depth, tree: do_put(tree, key(index, depth), value))
  end

  @doc """
  Given a vector, an accumulator, and a function, iterate over
  each item in the vector passing the item and the accumulator
  to the function. The function should return the modified
  accumulator.

      iex> v = Vector.new([1,2,3])
      iex> Vector.reduce(v, 0, &(&2 + &1))
      6
  """
  @spec reduce(t, acc, (any(), acc -> acc)) :: acc when acc: any()
  def reduce(vec(size: size, depth: depth, tree: tree), acc, fun) do
    do_reduce(tree, depth - 1, size, 0, acc, fun)
  end

  # Inner node: `level` is the number of levels between this node and the
  # leaves, so every child covers @width^level consecutive indices.
  defp do_reduce(node, level, size, offset, acc, fun) when level > 0 and is_list(node) do
    span = capacity(level)

    node
    |> Enum.with_index()
    |> Enum.reduce(acc, fn {child, i}, inner_acc ->
      do_reduce(child, level - 1, size, offset + i * span, inner_acc, fun)
    end)
  end

  # Leaf: only the first `size - offset` slots hold real elements; anything
  # after that is nil padding and must not reach `fun`.
  defp do_reduce(node, _level, size, offset, acc, fun) when is_list(node) do
    node
    |> Enum.take(max(size - offset, 0))
    |> Enum.reduce(acc, fun)
  end

  # nil padding in place of a missing subtree contributes nothing.
  defp do_reduce(_node, _level, _size, _offset, acc, _fun), do: acc

  # Number of elements a trie of the given depth can hold (@width^depth).
  # A depth of 0 is the empty vector and holds nothing.
  defp capacity(0), do: 0
  defp capacity(depth), do: 1 <<< (@bits * depth)

  # Smallest depth (at least 1) whose capacity fits `count` elements.
  defp depth_for(count), do: depth_for(count, 1)

  defp depth_for(count, depth) do
    if count <= capacity(depth), do: depth, else: depth_for(count, depth + 1)
  end

  # Adds root levels until the trie can hold `size` elements. The previous
  # root becomes child 0 of the new root.
  defp grow(0, _tree, size), do: grow(1, [], size)

  defp grow(depth, tree, size) do
    if size > capacity(depth) do
      grow(depth + 1, [tree], size)
    else
      {depth, tree}
    end
  end

  # Splits `index` into `depth` child positions, root level first. Digits are
  # produced least significant first and prepended, which leaves the most
  # significant digit at the head without any list appends.
  defp key(index, depth) when depth > 0 do
    Enum.reduce(0..(depth - 1), [], fn level, digits ->
      [(index >>> (level * @bits)) &&& @mask | digits]
    end)
  end

  # Repeatedly chunks the list into nodes of @width children until the
  # requested depth is reached, padding a partial last chunk with nil.
  defp tree_from_list(list, depth) when depth > 1 do
    list
    |> Enum.chunk_every(@width, @width, List.duplicate(nil, @width))
    |> tree_from_list(depth - 1)
  end

  defp tree_from_list(list, _depth), do: list

  # Follows the key down the trie and returns whatever sits at its end.
  defp do_get(node, []), do: node

  defp do_get(node, [idx | rest_key]) do
    node
    |> Enum.at(idx)
    |> do_get(rest_key)
  end

  # Rebuilds the path addressed by the key with `value` at its end; missing
  # subtrees along the way start out as empty nodes.
  defp do_put(_node, [], value), do: value

  defp do_put(node, [idx | rest_key], value) do
    child = do_put(Enum.at(node, idx) || [], rest_key, value)
    missing = idx - length(node) + 1

    # Pad the node with nil so that slot `idx` exists before replacing it.
    node = if missing > 0, do: node ++ List.duplicate(nil, missing), else: node
    List.replace_at(node, idx, child)
  end
end
# Start ExUnit so the test cases defined below are run by this script.
ExUnit.start()
defmodule VectorTest do
  use ExUnit.Case

  # Number of elements used by the timing tests.
  @size 100_000

  # Runs `fun` under :timer.tc and returns only the elapsed microseconds.
  defp elapsed(fun) do
    {microsecs, _result} = :timer.tc(fun)
    microsecs
  end

  test "put" do
    # Each step is {index, value, vector expected after the put}.
    steps = [
      {0, "first", {Vector, 1, 1, ["first"]}},
      {1, "second", {Vector, 2, 1, ["first", "second"]}},
      {2, "third", {Vector, 3, 1, ["first", "second", "third"]}},
      {3, "fourth", {Vector, 4, 1, ["first", "second", "third", "fourth"]}},
      {4, "fifth", {Vector, 5, 2, [["first", "second", "third", "fourth"], ["fifth"]]}},
      {2, "third changed",
       {Vector, 5, 2, [["first", "second", "third changed", "fourth"], ["fifth"]]}}
    ]

    Enum.reduce(steps, Vector.new(), fn {index, value, expected}, current ->
      updated = Vector.put(current, index, value)
      assert updated == expected
      updated
    end)
  end

  test "new" do
    small = 1 |> List.duplicate(5) |> Vector.new()
    assert small == {Vector, 5, 2, [[1, 1, 1, 1], [1, nil, nil, nil]]}

    # 64 elements fill a depth-3 trie completely: 4 branches of 4 full leaves.
    leaf = [1, 1, 1, 1]
    branch = [leaf, leaf, leaf, leaf]
    full = 1 |> List.duplicate(64) |> Vector.new()
    assert full == {Vector, 64, 3, [branch, branch, branch, branch]}
  end

  test "reduce" do
    total =
      [1, 2, 3, 4, 5, 6]
      |> Vector.new()
      |> Vector.reduce(0, &(&1 + &2))

    assert total == 21
  end

  test "creation speed" do
    list_time = elapsed(fn -> List.duplicate("foo", @size) end)
    IO.puts("List creation took #{list_time} microsecs") # 2,815 microsecs

    source = List.duplicate("foo", @size)
    vector_time = elapsed(fn -> Vector.new(source) end)
    IO.puts("Vector creation took #{vector_time} microsecs") # 18,996 microsecs
  end

  test "iteration speed" do
    counter = fn _, count -> count + 1 end

    items = List.duplicate("foo", @size)
    list_time = elapsed(fn -> Enum.reduce(items, 0, counter) end)
    IO.puts("List traversal took #{list_time} microsecs") # 1,605 microsecs

    vector = "foo" |> List.duplicate(@size) |> Vector.new()
    vector_time = elapsed(fn -> Vector.reduce(vector, 0, counter) end)
    IO.puts("Vector traversal took #{vector_time} microsecs") # 13,372 microsecs
  end

  test "access speed" do
    last = @size - 1

    items = List.duplicate("foo", @size)
    list_time = elapsed(fn -> assert Enum.at(items, last) == "foo" end)
    IO.puts("List access took #{list_time} microsecs") # 997 microsecs

    vector = "foo" |> List.duplicate(@size) |> Vector.new()
    vector_time = elapsed(fn -> assert Vector.get(vector, last) == "foo" end)
    IO.puts("Vector access took #{vector_time} microsecs") # 3 microsecs
  end
end