Skip to content

Commit 5a5c1ea

Browse files
committed
fix: record cache entries for files that don't match formatters
Signed-off-by: Brian McGee <[email protected]>
1 parent 618f6f7 commit 5a5c1ea

11 files changed

+215
-171
lines changed

cache/cache.go

+19-37
Original file line numberDiff line numberDiff line change
@@ -5,9 +5,7 @@ import (
55
"crypto/sha1"
66
"encoding/hex"
77
"fmt"
8-
"io/fs"
98
"os"
10-
"path/filepath"
119
"runtime"
1210
"time"
1311

@@ -180,7 +178,7 @@ func putEntry(bucket *bolt.Bucket, path string, entry *Entry) error {
180178

181179
// ChangeSet is used to walk a filesystem, starting at root, and outputting any new or changed paths using pathsCh.
182180
// It determines if a path is new or has changed by comparing against cache entries.
183-
func ChangeSet(ctx context.Context, walker walk.Walker, pathsCh chan<- string) error {
181+
func ChangeSet(ctx context.Context, walker walk.Walker, filesCh chan<- *walk.File) error {
184182
start := time.Now()
185183

186184
defer func() {
@@ -198,24 +196,21 @@ func ChangeSet(ctx context.Context, walker walk.Walker, pathsCh chan<- string) e
198196
}
199197
}()
200198

201-
// for quick removal of tree root from paths
202-
relPathOffset := len(walker.Root()) + 1
203-
204-
return walker.Walk(ctx, func(path string, info fs.FileInfo, err error) error {
199+
return walker.Walk(ctx, func(file *walk.File, err error) error {
205200
select {
206201
case <-ctx.Done():
207202
return ctx.Err()
208203
default:
209204
if err != nil {
210205
return fmt.Errorf("%w: failed to walk path", err)
211-
} else if info.IsDir() {
206+
} else if file.Info.IsDir() {
212207
// ignore directories
213208
return nil
214209
}
215210
}
216211

217212
// ignore symlinks
218-
if info.Mode()&os.ModeSymlink == os.ModeSymlink {
213+
if file.Info.Mode()&os.ModeSymlink == os.ModeSymlink {
219214
return nil
220215
}
221216

@@ -229,13 +224,12 @@ func ChangeSet(ctx context.Context, walker walk.Walker, pathsCh chan<- string) e
229224
bucket = tx.Bucket([]byte(pathsBucket))
230225
}
231226

232-
relPath := path[relPathOffset:]
233-
cached, err := getEntry(bucket, relPath)
227+
cached, err := getEntry(bucket, file.RelPath)
234228
if err != nil {
235229
return err
236230
}
237231

238-
changedOrNew := cached == nil || !(cached.Modified == info.ModTime() && cached.Size == info.Size())
232+
changedOrNew := cached == nil || !(cached.Modified == file.Info.ModTime() && cached.Size == file.Info.Size())
239233

240234
stats.Add(stats.Traversed, 1)
241235
if !changedOrNew {
@@ -250,7 +244,7 @@ func ChangeSet(ctx context.Context, walker walk.Walker, pathsCh chan<- string) e
250244
case <-ctx.Done():
251245
return ctx.Err()
252246
default:
253-
pathsCh <- relPath
247+
filesCh <- file
254248
}
255249

256250
// close the current tx if we have reached the batch size
@@ -266,47 +260,35 @@ func ChangeSet(ctx context.Context, walker walk.Walker, pathsCh chan<- string) e
266260
}
267261

268262
// Update is used to record updated cache information for the specified list of paths.
269-
func Update(treeRoot string, paths []string) (int, error) {
263+
func Update(files []*walk.File) error {
270264
start := time.Now()
271265
defer func() {
272-
logger.Infof("finished updating %v paths in %v", len(paths), time.Since(start))
266+
logger.Infof("finished processing %v paths in %v", len(files), time.Since(start))
273267
}()
274268

275-
if len(paths) == 0 {
276-
return 0, nil
269+
if len(files) == 0 {
270+
return nil
277271
}
278272

279-
var changes int
280-
281-
return changes, db.Update(func(tx *bolt.Tx) error {
273+
return db.Update(func(tx *bolt.Tx) error {
282274
bucket := tx.Bucket([]byte(pathsBucket))
283275

284-
for _, path := range paths {
285-
cached, err := getEntry(bucket, path)
286-
if err != nil {
287-
return err
288-
}
289-
290-
pathInfo, err := os.Stat(filepath.Join(treeRoot, path))
276+
for _, f := range files {
277+
currentInfo, err := os.Stat(f.Path)
291278
if err != nil {
292279
return err
293280
}
294281

295-
if cached == nil || !(cached.Modified == pathInfo.ModTime() && cached.Size == pathInfo.Size()) {
296-
changes += 1
297-
} else {
298-
// no change to write
299-
continue
282+
if !(f.Info.ModTime() == currentInfo.ModTime() && f.Info.Size() == currentInfo.Size()) {
283+
stats.Add(stats.Formatted, 1)
300284
}
301285

302-
stats.Add(stats.Formatted, 1)
303-
304286
entry := Entry{
305-
Size: pathInfo.Size(),
306-
Modified: pathInfo.ModTime(),
287+
Size: currentInfo.Size(),
288+
Modified: currentInfo.ModTime(),
307289
}
308290

309-
if err = putEntry(bucket, path, &entry); err != nil {
291+
if err = putEntry(bucket, f.RelPath, &entry); err != nil {
310292
return err
311293
}
312294
}

cli/format.go

+26-33
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,6 @@ import (
55
"context"
66
"errors"
77
"fmt"
8-
"io/fs"
98
"os"
109
"os/signal"
1110
"path/filepath"
@@ -35,8 +34,8 @@ var (
3534
globalExcludes []glob.Glob
3635
formatters map[string]*format.Formatter
3736
pipelines map[string]*format.Pipeline
38-
pathsCh chan string
39-
processedCh chan string
37+
filesCh chan *walk.File
38+
processedCh chan *walk.File
4039

4140
ErrFailOnChange = errors.New("unexpected changes detected, --fail-on-change is enabled")
4241
)
@@ -142,10 +141,10 @@ func (f *Format) Run() (err error) {
142141

143142
// create a channel for paths to be processed
144143
// we use a multiple of batch size here to allow for greater concurrency
145-
pathsCh = make(chan string, BatchSize*runtime.NumCPU())
144+
filesCh = make(chan *walk.File, BatchSize*runtime.NumCPU())
146145

147146
// create a channel for tracking paths that have been processed
148-
processedCh = make(chan string, cap(pathsCh))
147+
processedCh = make(chan *walk.File, cap(filesCh))
149148

150149
// start concurrent processing tasks
151150
eg.Go(updateCache(ctx))
@@ -185,26 +184,26 @@ func walkFilesystem(ctx context.Context) func() error {
185184
return fmt.Errorf("failed to create walker: %w", err)
186185
}
187186

188-
defer close(pathsCh)
187+
defer close(filesCh)
189188

190189
if Cli.NoCache {
191-
return walker.Walk(ctx, func(path string, info fs.FileInfo, err error) error {
190+
return walker.Walk(ctx, func(file *walk.File, err error) error {
192191
select {
193192
case <-ctx.Done():
194193
return ctx.Err()
195194
default:
196195
// ignore symlinks and directories
197-
if !(info.IsDir() || info.Mode()&os.ModeSymlink == os.ModeSymlink) {
196+
if !(file.Info.IsDir() || file.Info.Mode()&os.ModeSymlink == os.ModeSymlink) {
198197
stats.Add(stats.Traversed, 1)
199198
stats.Add(stats.Emitted, 1)
200-
pathsCh <- path
199+
filesCh <- file
201200
}
202201
return nil
203202
}
204203
})
205204
}
206205

207-
if err = cache.ChangeSet(ctx, walker, pathsCh); err != nil {
206+
if err = cache.ChangeSet(ctx, walker, filesCh); err != nil {
208207
return fmt.Errorf("failed to generate change set: %w", err)
209208
}
210209
return nil
@@ -213,19 +212,11 @@ func walkFilesystem(ctx context.Context) func() error {
213212

214213
func updateCache(ctx context.Context) func() error {
215214
return func() error {
216-
batch := make([]string, 0, BatchSize)
217-
218-
var changes int
215+
batch := make([]*walk.File, 0, BatchSize)
219216

220217
processBatch := func() error {
221-
if Cli.NoCache {
222-
changes += len(batch)
223-
} else {
224-
count, err := cache.Update(Cli.TreeRoot, batch)
225-
if err != nil {
226-
return err
227-
}
228-
changes += count
218+
if err := cache.Update(batch); err != nil {
219+
return err
229220
}
230221
batch = batch[:0]
231222
return nil
@@ -254,7 +245,7 @@ func updateCache(ctx context.Context) func() error {
254245
return err
255246
}
256247

257-
if Cli.FailOnChange && changes != 0 {
248+
if Cli.FailOnChange && stats.Value(stats.Formatted) != 0 {
258249
return ErrFailOnChange
259250
}
260251

@@ -265,28 +256,28 @@ func updateCache(ctx context.Context) func() error {
265256

266257
func applyFormatters(ctx context.Context) func() error {
267258
fg, ctx := errgroup.WithContext(ctx)
268-
batches := make(map[string][]string)
259+
batches := make(map[string][]*walk.File)
269260

270-
tryApply := func(key string, path string) {
261+
tryApply := func(key string, file *walk.File) {
271262
batch, ok := batches[key]
272263
if !ok {
273-
batch = make([]string, 0, BatchSize)
264+
batch = make([]*walk.File, 0, BatchSize)
274265
}
275-
batch = append(batch, path)
266+
batch = append(batch, file)
276267
batches[key] = batch
277268

278269
if len(batch) == BatchSize {
279270
pipeline := pipelines[key]
280271

281272
// copy the batch
282-
paths := make([]string, len(batch))
283-
copy(paths, batch)
273+
files := make([]*walk.File, len(batch))
274+
copy(files, batch)
284275

285276
fg.Go(func() error {
286-
if err := pipeline.Apply(ctx, paths); err != nil {
277+
if err := pipeline.Apply(ctx, files); err != nil {
287278
return err
288279
}
289-
for _, path := range paths {
280+
for _, path := range files {
290281
processedCh <- path
291282
}
292283
return nil
@@ -322,17 +313,19 @@ func applyFormatters(ctx context.Context) func() error {
322313
close(processedCh)
323314
}()
324315

325-
for path := range pathsCh {
316+
for file := range filesCh {
326317
var matched bool
327318
for key, pipeline := range pipelines {
328-
if !pipeline.Wants(path) {
319+
if !pipeline.Wants(file) {
329320
continue
330321
}
331322
matched = true
332-
tryApply(key, path)
323+
tryApply(key, file)
333324
}
334325
if matched {
335326
stats.Add(stats.Matched, 1)
327+
} else {
328+
processedCh <- file
336329
}
337330
}
338331

0 commit comments

Comments
 (0)