v.logger.WithError(err).Error("stat failed")
return nil
}
- devnum := fi.Sys().(*syscall.Stat_t).Dev
+ // uint64() cast here supports GOOS=darwin where Dev is
+ // int32. If the device number is negative, the unsigned
+ // devnum won't be the real device number any more, but that's
+ // fine -- all we care about is getting the same number each
+ // time.
+ devnum := uint64(fi.Sys().(*syscall.Stat_t).Dev)
var fs syscall.Statfs_t
if err := syscall.Statfs(v.Root, &fs); err != nil {
continue
}
blockdirpath := filepath.Join(v.Root, subdir)
- blockdir, err := v.os.Open(blockdirpath)
- if err != nil {
- v.logger.WithError(err).Errorf("error reading %q", blockdirpath)
- return fmt.Errorf("error reading %q: %s", blockdirpath, err)
- }
- v.os.stats.TickOps("readdir")
- v.os.stats.Tick(&v.os.stats.ReaddirOps)
- // ReadDir() (compared to Readdir(), which returns
- // FileInfo structs) helps complete the sequence of
- // readdirent calls as quickly as possible, reducing
- // the likelihood of NFS EBADCOOKIE (523) errors.
- dirents, err := blockdir.ReadDir(-1)
- blockdir.Close()
- if err != nil {
- v.logger.WithError(err).Errorf("error reading %q", blockdirpath)
- return fmt.Errorf("error reading %q: %s", blockdirpath, err)
+
+ var dirents []os.DirEntry
+ for attempt := 0; ; attempt++ {
+ v.os.stats.TickOps("readdir")
+ v.os.stats.Tick(&v.os.stats.ReaddirOps)
+ dirents, err = os.ReadDir(blockdirpath)
+ if err == nil {
+ break
+ } else if attempt < 5 && strings.Contains(err.Error(), "errno 523") {
+ // EBADCOOKIE (NFS stopped accepting
+ // our readdirent cookie) -- retry a
+ // few times before giving up
+ v.logger.WithError(err).Printf("retry after error reading %s", blockdirpath)
+ continue
+ } else {
+ return err
+ }
}
+
for _, dirent := range dirents {
fileInfo, err := dirent.Info()
if os.IsNotExist(err) {