Skip to content

Commit 7ba590d

Browse files
committed
More realistic row overhead estimate
Some experimentation suggests the row overhead for MySQL and Postgresql is 130-150 bytes beyond the size of the key and value columns. On Sqlite it is more like 90 bytes though, but lets go for the worst case.
1 parent 0184482 commit 7ba590d

File tree

7 files changed

+71
-72
lines changed

7 files changed

+71
-72
lines changed

app/models/solid_cache/entry.rb

+5-7
Original file line numberDiff line numberDiff line change
@@ -4,12 +4,10 @@ module SolidCache
44
class Entry < Record
55
include Expiration, Size
66

7-
ID_BYTE_SIZE = 8
8-
CREATED_AT_BYTE_SIZE = 8
9-
KEY_HASH_BYTE_SIZE = 8
10-
VALUE_BYTE_SIZE = 4
11-
FIXED_SIZE_COLUMNS_BYTE_SIZE = ID_BYTE_SIZE + CREATED_AT_BYTE_SIZE + KEY_HASH_BYTE_SIZE + VALUE_BYTE_SIZE
12-
7+
# The estimated cost of an extra row in bytes, including fixed size columns, overhead, indexes and free space
8+
# Based on expirimentation on SQLite, MySQL and Postgresql.
9+
# A bit high for SQLite (more like 90 bytes), but about right for MySQL/Postgresql.
10+
ESTIMATED_ROW_OVERHEAD = 140
1311
KEY_HASH_ID_RANGE = -(2**63)..(2**63 - 1)
1412

1513
class << self
@@ -167,7 +165,7 @@ def key_hash_for(key)
167165
end
168166

169167
def byte_size_for(payload)
170-
payload[:key].to_s.bytesize + payload[:value].to_s.bytesize + FIXED_SIZE_COLUMNS_BYTE_SIZE
168+
payload[:key].to_s.bytesize + payload[:value].to_s.bytesize + ESTIMATED_ROW_OVERHEAD
171169
end
172170
end
173171
end

docker-compose.yml

+4-3
Original file line numberDiff line numberDiff line change
@@ -1,21 +1,22 @@
11
version: "3.8"
22

33
volumes:
4-
db: {}
4+
mysql: {}
5+
postgres: {}
56

67
services:
78
postgres:
89
image: postgres:15.1
910
environment:
1011
POSTGRES_HOST_AUTH_METHOD: "trust"
1112
volumes:
12-
- db:/var/lib/postgres
13+
- postgres:/var/lib/postgres
1314
ports: [ "127.0.0.1:55432:5432" ]
1415
mysql:
1516
image: mysql:8.0.31
1617
environment:
1718
MYSQL_ALLOW_EMPTY_PASSWORD: "yes"
1819
volumes:
19-
- db:/var/lib/mysql
20+
- mysql:/var/lib/mysql
2021
ports: [ "127.0.0.1:33060:3306" ]
2122

test/dummy/config/environments/development.rb

+1-1
Original file line numberDiff line numberDiff line change
@@ -30,7 +30,7 @@
3030
else
3131
config.action_controller.perform_caching = false
3232

33-
config.cache_store = :null_store
33+
config.cache_store = :solid_cache_store
3434
end
3535

3636
# Print deprecation notices to the Rails logger.

test/models/solid_cache/entry/size/estimate_test.rb

+26-26
Original file line numberDiff line numberDiff line change
@@ -11,21 +11,21 @@ class EntrySizeEstimateTest < ActiveSupport::TestCase
1111
test "gets exact estimate when samples sizes are big enough" do
1212
write_entries(value_lengths: [ 1, 2, 3, 4, 5, 6, 7, 8, 9, 10 ])
1313

14-
assert_equal 415, estimate(samples: 12)
15-
assert_equal 415, estimate(samples: 10)
16-
assert_equal 456, estimate(samples: 6)
17-
assert_equal 457, estimate(samples: 5)
14+
assert_equal 1535, estimate(samples: 12)
15+
assert_equal 1535, estimate(samples: 10)
16+
assert_equal 1688, estimate(samples: 6)
17+
assert_equal 1689, estimate(samples: 5)
1818
end
1919

2020
test "test larger sample estimates" do
2121
values_lengths = with_fixed_srand(1) { 1000.times.map { (rand**2 * 1000).to_i } }
2222
write_entries(value_lengths: values_lengths)
2323

24-
assert_equal 369257, estimate(samples: 1000)
25-
assert_equal 369550, estimate(samples: 500)
26-
with_fixed_srand(1) { assert_equal 383576, estimate(samples: 100) }
27-
with_fixed_srand(1) { assert_equal 357109, estimate(samples: 50) }
28-
with_fixed_srand(1) { assert_equal 326614, estimate(samples: 10) }
24+
assert_equal 481257, estimate(samples: 1000)
25+
assert_equal 481662, estimate(samples: 500)
26+
with_fixed_srand(1) { assert_equal 501624, estimate(samples: 100) }
27+
with_fixed_srand(1) { assert_equal 477621, estimate(samples: 50) }
28+
with_fixed_srand(1) { assert_equal 471878, estimate(samples: 10) }
2929
end
3030

3131
test "test with gaps in records estimates" do
@@ -34,12 +34,12 @@ class EntrySizeEstimateTest < ActiveSupport::TestCase
3434
first_mod = Entry.first.id % 3
3535
Entry.where("id % 3 = #{first_mod}").delete_all
3636

37-
assert_equal 249940, estimate(samples: 1000)
38-
assert_equal 250037, estimate(samples: 500)
39-
with_fixed_srand(1) { assert_equal 249354, estimate(samples: 334) }
40-
with_fixed_srand(1) { assert_equal 267523, estimate(samples: 100) }
41-
with_fixed_srand(1) { assert_equal 257970, estimate(samples: 50) }
42-
with_fixed_srand(1) { assert_equal 203365, estimate(samples: 10) }
37+
assert_equal 324532, estimate(samples: 1000)
38+
assert_equal 324741, estimate(samples: 500)
39+
with_fixed_srand(1) { assert_equal 323946, estimate(samples: 334) }
40+
with_fixed_srand(1) { assert_equal 345103, estimate(samples: 100) }
41+
with_fixed_srand(1) { assert_equal 335770, estimate(samples: 50) }
42+
with_fixed_srand(1) { assert_equal 281944, estimate(samples: 10) }
4343
end
4444

4545
test "test with more gaps in records estimates" do
@@ -48,12 +48,12 @@ class EntrySizeEstimateTest < ActiveSupport::TestCase
4848
first_mod = Entry.first.id % 4
4949
Entry.where("id % 4 != #{first_mod}").delete_all
5050

51-
assert_equal 92304, estimate(samples: 1000)
52-
assert_equal 92592, estimate(samples: 500)
53-
with_fixed_srand(1) { assert_equal 92519, estimate(samples: 250) }
54-
with_fixed_srand(1) { assert_equal 95475, estimate(samples: 100) }
55-
with_fixed_srand(1) { assert_equal 101601, estimate(samples: 50) }
56-
with_fixed_srand(1) { assert_equal 13362, estimate(samples: 10) }
51+
assert_equal 120304, estimate(samples: 1000)
52+
assert_equal 121488, estimate(samples: 500)
53+
with_fixed_srand(1) { assert_equal 121188, estimate(samples: 250) }
54+
with_fixed_srand(1) { assert_equal 126768, estimate(samples: 100) }
55+
with_fixed_srand(1) { assert_equal 132657, estimate(samples: 50) }
56+
with_fixed_srand(1) { assert_equal 25537, estimate(samples: 10) }
5757
end
5858

5959
test "overestimate when all samples sizes are the same" do
@@ -62,11 +62,11 @@ class EntrySizeEstimateTest < ActiveSupport::TestCase
6262
# estimate in this case.
6363
write_entries(value_lengths: [1] * 1000)
6464

65-
assert_equal 37000, estimate(samples: 1000)
66-
assert_equal 73963, estimate(samples: 999)
67-
assert_equal 55500, estimate(samples: 500)
68-
with_fixed_srand(1) { assert_equal 67648, estimate(samples: 6) }
69-
with_fixed_srand(1) { assert_equal 81178, estimate(samples: 5) }
65+
assert_equal 149000, estimate(samples: 1000)
66+
assert_equal 297851, estimate(samples: 999)
67+
assert_equal 223500, estimate(samples: 500)
68+
with_fixed_srand(1) { assert_equal 272422, estimate(samples: 6) }
69+
with_fixed_srand(1) { assert_equal 326906, estimate(samples: 5) }
7070
end
7171

7272
private

test/models/solid_cache/entry/size/moving_average_estimate_test.rb

+7-7
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@ class EntrySizeMovingAverageEstimateTest < ActiveSupport::TestCase
1313

1414
estimate = Entry::Size::MovingAverageEstimate.new(samples: 12)
1515
assert_predicate estimate, :exact?
16-
assert_equal 415, estimate.size
16+
assert_equal 1535, estimate.size
1717
end
1818

1919
test "tracks moving average" do
@@ -22,24 +22,24 @@ class EntrySizeMovingAverageEstimateTest < ActiveSupport::TestCase
2222
Entry.write Entry::Size::MovingAverageEstimate::ESTIMATES_KEY, "4637774|4754378|7588547"
2323

2424
with_fixed_srand(1) do
25-
assert_equal 10075987, estimate(samples: 1)
25+
assert_equal 10449357, estimate(samples: 1)
2626
end
2727

28-
assert_equal "4754378|7588547|17885035", Entry.read(Entry::Size::MovingAverageEstimate::ESTIMATES_KEY)
28+
assert_equal "4754378|7588547|19005147", Entry.read(Entry::Size::MovingAverageEstimate::ESTIMATES_KEY)
2929
end
3030

3131
test "appends to moving average when less than required items" do
3232
write_entries(value_lengths: 5000.times.to_a)
3333

3434
assert_nil Entry.read(Entry::Size::MovingAverageEstimate::ESTIMATES_KEY)
3535

36-
with_fixed_srand(1) { assert_equal 19872121, estimate(samples: 2) }
36+
with_fixed_srand(1) { assert_equal 20991897, estimate(samples: 2) }
3737

38-
assert_equal "19872121", Entry.read(Entry::Size::MovingAverageEstimate::ESTIMATES_KEY)
38+
assert_equal "20991897", Entry.read(Entry::Size::MovingAverageEstimate::ESTIMATES_KEY)
3939

40-
with_fixed_srand(2) { assert_equal 11077118, estimate(samples: 2) }
40+
with_fixed_srand(2) { assert_equal 11917062, estimate(samples: 2) }
4141

42-
assert_equal "19872121|2282115", Entry.read(Entry::Size::MovingAverageEstimate::ESTIMATES_KEY)
42+
assert_equal "20991897|2842227", Entry.read(Entry::Size::MovingAverageEstimate::ESTIMATES_KEY)
4343
end
4444

4545
private

test/models/solid_cache/entry/size_test.rb

+25-25
Original file line numberDiff line numberDiff line change
@@ -11,20 +11,20 @@ class EntrySizeTest < ActiveSupport::TestCase
1111
test "gets exact estimate when samples sizes are big enough" do
1212
write_entries(value_lengths: [ 1, 2, 3, 4, 5, 6, 7, 8, 9, 10 ])
1313

14-
assert_equal 415, Entry.estimated_size(samples: 12)
15-
assert_equal 533, Entry.estimated_size(samples: 10)
16-
assert_equal 537, Entry.estimated_size(samples: 6)
14+
assert_equal 1535, Entry.estimated_size(samples: 12)
15+
assert_equal 1878, Entry.estimated_size(samples: 10)
16+
assert_equal 1882, Entry.estimated_size(samples: 6)
1717
end
1818

1919
test "test larger sample estimates" do
2020
values_lengths = with_fixed_srand(1) { 1000.times.map { (rand**2 * 1000).to_i } }
2121
write_entries(value_lengths: values_lengths)
2222

23-
assert_equal 369257, Entry.estimated_size(samples: 1000)
24-
assert_equal 369926, Entry.estimated_size(samples: 501)
25-
with_fixed_srand(1) { assert_equal 383898, Entry.estimated_size(samples: 100) }
26-
with_fixed_srand(1) { assert_equal 357433, Entry.estimated_size(samples: 50) }
27-
with_fixed_srand(1) { assert_equal 326934, Entry.estimated_size(samples: 10) }
23+
assert_equal 481257, Entry.estimated_size(samples: 1000)
24+
assert_equal 482262, Entry.estimated_size(samples: 501)
25+
with_fixed_srand(1) { assert_equal 502065, Entry.estimated_size(samples: 100) }
26+
with_fixed_srand(1) { assert_equal 478066, Entry.estimated_size(samples: 50) }
27+
with_fixed_srand(1) { assert_equal 472343, Entry.estimated_size(samples: 10) }
2828
end
2929

3030
test "test with gaps in records estimates" do
@@ -33,12 +33,12 @@ class EntrySizeTest < ActiveSupport::TestCase
3333
first_mod = Entry.first.id % 3
3434
Entry.where("id % 3 = #{first_mod}").delete_all
3535

36-
assert_equal 249940, Entry.estimated_size(samples: 1000)
37-
assert_equal 250120, Entry.estimated_size(samples: 500)
38-
with_fixed_srand(1) { assert_equal 249639, Entry.estimated_size(samples: 334) }
39-
with_fixed_srand(1) { assert_equal 267921, Entry.estimated_size(samples: 100) }
40-
with_fixed_srand(1) { assert_equal 258414, Entry.estimated_size(samples: 50) }
41-
with_fixed_srand(1) { assert_equal 203756, Entry.estimated_size(samples: 10) }
36+
assert_equal 324532, Entry.estimated_size(samples: 1000)
37+
assert_equal 324936, Entry.estimated_size(samples: 500)
38+
with_fixed_srand(1) { assert_equal 324567, Entry.estimated_size(samples: 334) }
39+
with_fixed_srand(1) { assert_equal 345649, Entry.estimated_size(samples: 100) }
40+
with_fixed_srand(1) { assert_equal 336366, Entry.estimated_size(samples: 50) }
41+
with_fixed_srand(1) { assert_equal 282492, Entry.estimated_size(samples: 10) }
4242
end
4343

4444
test "test with more gaps in records estimates" do
@@ -47,12 +47,12 @@ class EntrySizeTest < ActiveSupport::TestCase
4747
first_mod = Entry.first.id % 4
4848
Entry.where("id % 4 != #{first_mod}").delete_all
4949

50-
assert_equal 92304, Entry.estimated_size(samples: 1000)
51-
assert_equal 92674, Entry.estimated_size(samples: 501)
52-
with_fixed_srand(1) { assert_equal 92566, Entry.estimated_size(samples: 250) }
53-
with_fixed_srand(1) { assert_equal 95594, Entry.estimated_size(samples: 100) }
54-
with_fixed_srand(1) { assert_equal 101852, Entry.estimated_size(samples: 50) }
55-
with_fixed_srand(1) { assert_equal 13377, Entry.estimated_size(samples: 10) }
50+
assert_equal 120304, Entry.estimated_size(samples: 1000)
51+
assert_equal 121683, Entry.estimated_size(samples: 501)
52+
with_fixed_srand(1) { assert_equal 121240, Entry.estimated_size(samples: 250) }
53+
with_fixed_srand(1) { assert_equal 126976, Entry.estimated_size(samples: 100) }
54+
with_fixed_srand(1) { assert_equal 133014, Entry.estimated_size(samples: 50) }
55+
with_fixed_srand(1) { assert_equal 25596, Entry.estimated_size(samples: 10) }
5656
end
5757

5858
test "overestimate when all samples sizes are the same" do
@@ -61,11 +61,11 @@ class EntrySizeTest < ActiveSupport::TestCase
6161
# estimate in this case.
6262
write_entries(value_lengths: [1] * 1000)
6363

64-
assert_equal 37000, Entry.estimated_size(samples: 1000)
65-
assert_equal 74008, Entry.estimated_size(samples: 999)
66-
assert_equal 55582, Entry.estimated_size(samples: 501)
67-
with_fixed_srand(1) { assert_equal 67761, Entry.estimated_size(samples: 6) }
68-
with_fixed_srand(1) { assert_equal 81304, Entry.estimated_size(samples: 5) }
64+
assert_equal 149000, Entry.estimated_size(samples: 1000)
65+
assert_equal 297897, Entry.estimated_size(samples: 999)
66+
assert_equal 223695, Entry.estimated_size(samples: 501)
67+
with_fixed_srand(1) { assert_equal 272741, Entry.estimated_size(samples: 6) }
68+
with_fixed_srand(1) { assert_equal 327280, Entry.estimated_size(samples: 5) }
6969
end
7070

7171
private

test/models/solid_cache/entry_test.rb

+3-3
Original file line numberDiff line numberDiff line change
@@ -54,11 +54,11 @@ class EntryTest < ActiveSupport::TestCase
5454

5555
test "byte_size" do
5656
Entry.write "hello".b, "test"
57-
assert_equal 37, Entry.uncached { Entry.last.byte_size }
57+
assert_equal 149, Entry.uncached { Entry.last.byte_size }
5858
Entry.write "hello".b, "12345"
59-
assert_equal 38, Entry.uncached { Entry.last.byte_size }
59+
assert_equal 150, Entry.uncached { Entry.last.byte_size }
6060
Entry.write "hi".b, "12345"
61-
assert_equal 35, Entry.uncached { Entry.last.byte_size }
61+
assert_equal 147, Entry.uncached { Entry.last.byte_size }
6262
end
6363

6464
private

0 commit comments

Comments
 (0)