Skip to content

Commit 8892a92

Browse files
nlfisaacs
authored andcommitted
feat: add a validateEntry option to compact
PR-URL: #55 Credit: @nlf Close: #55 Reviewed-by: @isaacs
1 parent 460b951 commit 8892a92

File tree

3 files changed

+117
-14
lines changed

3 files changed

+117
-14
lines changed

README.md

+10-1
Original file line numberDiff line numberDiff line change
@@ -495,12 +495,21 @@ cacache.rm.content(cachePath, 'sha512-SoMeDIGest/IN+BaSE64==').then(() => {
495495
})
496496
```
497497

498-
#### <a name="index-compact"></a> `> cacache.index.compact(cache, key, matchFn) -> Promise`
498+
#### <a name="index-compact"></a> `> cacache.index.compact(cache, key, matchFn, [opts]) -> Promise`
499499

500500
Uses `matchFn`, which must be a synchronous function that accepts two entries
501501
and returns a boolean indicating whether or not the two entries match, to
502502
deduplicate all entries in the cache for the given `key`.
503503

504+
If `opts.validateEntry` is provided, it will be called as a function with the
505+
only parameter being a single index entry. The function must return a Boolean,
506+
if it returns `true` the entry is considered valid and will be kept in the index,
507+
if it returns `false` the entry will be removed from the index.
508+
509+
If `opts.validateEntry` is not provided, however, every entry in the index will
510+
be deduplicated and kept until the first `null` integrity is reached, removing
511+
all entries that were written before the `null`.
512+
504513
The deduplicated list of entries is both written to the index, replacing the
505514
existing content, and returned in the Promise.
506515

lib/entry-index.js

+28-7
Original file line numberDiff line numberDiff line change
@@ -37,15 +37,31 @@ module.exports.compact = compact
3737
async function compact (cache, key, matchFn, opts = {}) {
3838
const bucket = bucketPath(cache, key)
3939
const entries = await bucketEntries(bucket)
40-
// reduceRight because the bottom-most result is the newest
40+
const newEntries = []
41+
// we loop backwards because the bottom-most result is the newest
4142
// since we add new entries with appendFile
42-
const newEntries = entries.reduceRight((acc, newEntry) => {
43-
if (!acc.find((oldEntry) => matchFn(oldEntry, newEntry))) {
44-
acc.push(newEntry)
43+
for (let i = entries.length - 1; i >= 0; --i) {
44+
const entry = entries[i]
45+
// a null integrity could mean either a delete was appended
46+
// or the user has simply stored an index that does not map
47+
// to any content. we determine if the user wants to keep the
48+
// null integrity based on the validateEntry function passed in options.
49+
// if the integrity is null and no validateEntry is provided, we break
50+
// as we consider the null integrity to be a deletion of everything
51+
// that came before it.
52+
if (entry.integrity === null && !opts.validateEntry) {
53+
break
4554
}
4655

47-
return acc
48-
}, [])
56+
// if this entry is valid, and it is either the first entry or
57+
// the newEntries array doesn't already include an entry that
58+
// matches this one based on the provided matchFn, then we add
59+
// it to the beginning of our list
60+
if ((!opts.validateEntry || opts.validateEntry(entry) === true) &&
61+
(newEntries.length === 0 || !newEntries.find((oldEntry) => matchFn(oldEntry, entry)))) {
62+
newEntries.unshift(entry)
63+
}
64+
}
4965

5066
const newIndex = '\n' + newEntries.map((entry) => {
5167
const stringified = JSON.stringify(entry)
@@ -87,7 +103,12 @@ async function compact (cache, key, matchFn, opts = {}) {
87103
// write the file atomically
88104
await disposer(setup(), teardown, write)
89105

90-
return newEntries.map((entry) => formatEntry(cache, entry, true))
106+
// we reverse the list we generated such that the newest
107+
// entries come first in order to make looping through them easier
108+
// the true passed to formatEntry tells it to keep null
109+
// integrity values, if they made it this far it's because
110+
// validateEntry returned true, and as such we should return it
111+
return newEntries.reverse().map((entry) => formatEntry(cache, entry, true))
91112
}
92113

93114
module.exports.insert = insert

test/entry-index.js

+79-6
Original file line numberDiff line numberDiff line change
@@ -60,21 +60,94 @@ test('compact', async (t) => {
6060
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 1 } }),
6161
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 2 } }),
6262
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 2 } }),
63-
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 1 } }),
64-
// compact will return entries with a null integrity
65-
index.insert(CACHE, KEY, null, { metadata: { rev: 3 } })
63+
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 1 } })
6664
])
6765

6866
const bucket = index.bucketPath(CACHE, KEY)
6967
const entries = await index.bucketEntries(bucket)
70-
t.equal(entries.length, 5, 'started with 5 entries')
68+
t.equal(entries.length, 4, 'started with 4 entries')
7169

7270
const filter = (entryA, entryB) => entryA.metadata.rev === entryB.metadata.rev
7371
const compacted = await index.compact(CACHE, KEY, filter)
74-
t.equal(compacted.length, 3, 'should return only three entries')
72+
t.equal(compacted.length, 2, 'should return only two entries')
73+
74+
const newEntries = await index.bucketEntries(bucket)
75+
t.equal(newEntries.length, 2, 'bucket was deduplicated')
76+
})
77+
78+
test('compact: treats null integrity without validateEntry as a delete', async (t) => {
79+
t.teardown(() => {
80+
index.delete.sync(CACHE, KEY)
81+
})
82+
// this one does not use Promise.all because we want to be certain
83+
// things are written in the right order
84+
await index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 1 } })
85+
await index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 2 } })
86+
// this is a delete, revs 1, 2 and 3 will be omitted
87+
await index.insert(CACHE, KEY, null, { metadata: { rev: 3 } })
88+
await index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 4 } })
89+
90+
const bucket = index.bucketPath(CACHE, KEY)
91+
const entries = await index.bucketEntries(bucket)
92+
t.equal(entries.length, 4, 'started with 4 entries')
93+
94+
const filter = (entryA, entryB) => entryA.metadata.rev === entryB.metadata.rev
95+
const compacted = await index.compact(CACHE, KEY, filter)
96+
t.equal(compacted.length, 1, 'should return only one entry')
97+
t.equal(compacted[0].metadata.rev, 4, 'kept rev 4')
98+
99+
const newEntries = await index.bucketEntries(bucket)
100+
t.equal(newEntries.length, 1, 'bucket was deduplicated')
101+
})
102+
103+
test('compact: leverages validateEntry to skip invalid entries', async (t) => {
104+
t.teardown(() => {
105+
index.delete.sync(CACHE, KEY)
106+
})
107+
await Promise.all([
108+
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 1 } }),
109+
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 2 } }),
110+
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 2 } }),
111+
index.insert(CACHE, KEY, INTEGRITY, { metadata: { rev: 1 } })
112+
])
113+
114+
const bucket = index.bucketPath(CACHE, KEY)
115+
const entries = await index.bucketEntries(bucket)
116+
t.equal(entries.length, 4, 'started with 4 entries')
117+
118+
const matchFn = (entryA, entryB) => entryA.metadata.rev === entryB.metadata.rev
119+
const validateEntry = (entry) => entry.metadata.rev > 1
120+
const compacted = await index.compact(CACHE, KEY, matchFn, { validateEntry })
121+
t.equal(compacted.length, 1, 'should return only one entries')
122+
t.equal(compacted[0].metadata.rev, 2, 'kept the rev 2 entry')
123+
124+
const newEntries = await index.bucketEntries(bucket)
125+
t.equal(newEntries.length, 1, 'bucket was deduplicated')
126+
})
127+
128+
test('compact: validateEntry allows for keeping null integrity', async (t) => {
129+
t.teardown(() => {
130+
index.delete.sync(CACHE, KEY)
131+
})
132+
await Promise.all([
133+
index.insert(CACHE, KEY, null, { metadata: { rev: 1 } }),
134+
index.insert(CACHE, KEY, null, { metadata: { rev: 2 } }),
135+
index.insert(CACHE, KEY, null, { metadata: { rev: 2 } }),
136+
index.insert(CACHE, KEY, null, { metadata: { rev: 1 } })
137+
])
138+
139+
const bucket = index.bucketPath(CACHE, KEY)
140+
const entries = await index.bucketEntries(bucket)
141+
t.equal(entries.length, 4, 'started with 4 entries')
142+
143+
const matchFn = (entryA, entryB) => entryA.metadata.rev === entryB.metadata.rev
144+
const validateEntry = (entry) => entry.metadata.rev > 1
145+
const compacted = await index.compact(CACHE, KEY, matchFn, { validateEntry })
146+
t.equal(compacted.length, 1, 'should return only one entry')
147+
t.equal(compacted[0].metadata.rev, 2, 'kept the rev 2 entry')
75148

76149
const newEntries = await index.bucketEntries(bucket)
77-
t.equal(newEntries.length, 3, 'bucket was deduplicated')
150+
t.equal(newEntries.length, 1, 'bucket was deduplicated')
78151
})
79152

80153
test('compact: ENOENT in chownr does not cause failure', async (t) => {

0 commit comments

Comments
 (0)