fix(tier): preserve volume data modification time

This commit is contained in:
Chris Lu
2026-06-13 12:30:08 -07:00
parent f724828bcb
commit 8359d05ac4
3 changed files with 224 additions and 1 deletions
+8
View File
@@ -2,6 +2,7 @@ package weed_server
import (
"fmt"
"os"
"time"
"github.com/seaweedfs/seaweedfs/weed/pb/volume_server_pb"
@@ -28,6 +29,7 @@ func (vs *VolumeServer) VolumeTierMoveDatFromRemote(req *volume_server_pb.Volume
if storageName == "" || storageKey == "" {
return fmt.Errorf("volume %d is already on local disk", req.VolumeId)
}
remoteFileModifiedTime := v.GetVolumeInfo().GetFiles()[0].GetModifiedTime()
// check whether the local .dat already exists
_, ok := v.DataBackend.(*backend.DiskFile)
@@ -62,6 +64,12 @@ func (vs *VolumeServer) VolumeTierMoveDatFromRemote(req *volume_server_pb.Volume
if err != nil {
return fmt.Errorf("backend %s copy file %s: %v", storageName, v.FileName(".dat"), err)
}
if remoteFileModifiedTime > 0 {
modifiedTime := time.Unix(int64(remoteFileModifiedTime), 0)
if err := os.Chtimes(v.FileName(".dat"), time.Now(), modifiedTime); err != nil {
return fmt.Errorf("restore data file %s modified time: %v", v.FileName(".dat"), err)
}
}
if req.KeepRemoteDatFile {
return nil
+211
View File
@@ -0,0 +1,211 @@
package weed_server
import (
"fmt"
"io"
"os"
"path/filepath"
"testing"
"time"
"google.golang.org/grpc"
"github.com/seaweedfs/seaweedfs/weed/pb/volume_server_pb"
"github.com/seaweedfs/seaweedfs/weed/stats"
"github.com/seaweedfs/seaweedfs/weed/storage"
"github.com/seaweedfs/seaweedfs/weed/storage/backend"
"github.com/seaweedfs/seaweedfs/weed/storage/needle"
"github.com/seaweedfs/seaweedfs/weed/storage/types"
"github.com/seaweedfs/seaweedfs/weed/util"
)
const tierTimestampTestBackendName = "tier_timestamp_test.default"
type discardServerStream[T any] struct {
grpc.ServerStream
}
func (s *discardServerStream[T]) Send(*T) error {
return nil
}
type tierTimestampTestBackend struct {
root string
}
func (b *tierTimestampTestBackend) ToProperties() map[string]string {
return map[string]string{"root": b.root}
}
func (b *tierTimestampTestBackend) NewStorageFile(key string, volumeInfo *volume_server_pb.VolumeInfo) backend.BackendStorageFile {
return &tierTimestampTestBackendFile{
path: filepath.Join(b.root, key),
volumeInfo: volumeInfo,
}
}
func (b *tierTimestampTestBackend) CopyFile(file *os.File, fn func(progressed int64, percentage float32) error) (key string, size int64, err error) {
key = "remote.dat"
fileInfo, err := file.Stat()
if err != nil {
return "", 0, err
}
output, err := os.Create(filepath.Join(b.root, key))
if err != nil {
return "", 0, err
}
defer output.Close()
size, err = io.Copy(output, io.NewSectionReader(file, 0, fileInfo.Size()))
if err == nil && fn != nil {
err = fn(size, 100)
}
return key, size, err
}
func (b *tierTimestampTestBackend) DownloadFile(fileName string, key string, fn func(progressed int64, percentage float32) error) (size int64, err error) {
input, err := os.Open(filepath.Join(b.root, key))
if err != nil {
return 0, err
}
defer input.Close()
output, err := os.Create(fileName)
if err != nil {
return 0, err
}
defer output.Close()
size, err = io.Copy(output, input)
if err == nil && fn != nil {
err = fn(size, 100)
}
return size, err
}
func (b *tierTimestampTestBackend) DeleteFile(key string) error {
return os.Remove(filepath.Join(b.root, key))
}
type tierTimestampTestBackendFile struct {
path string
volumeInfo *volume_server_pb.VolumeInfo
}
func (f *tierTimestampTestBackendFile) ReadAt(p []byte, off int64) (int, error) {
file, err := os.Open(f.path)
if err != nil {
return 0, err
}
defer file.Close()
return file.ReadAt(p, off)
}
func (f *tierTimestampTestBackendFile) WriteAt(p []byte, off int64) (int, error) {
return 0, fmt.Errorf("remote test file is read-only")
}
func (f *tierTimestampTestBackendFile) Truncate(off int64) error {
return fmt.Errorf("remote test file is read-only")
}
func (f *tierTimestampTestBackendFile) Close() error {
return nil
}
func (f *tierTimestampTestBackendFile) GetStat() (datSize int64, modTime time.Time, err error) {
files := f.volumeInfo.GetFiles()
if len(files) == 0 {
return 0, time.Time{}, fmt.Errorf("remote file info not found")
}
return int64(files[0].GetFileSize()), time.Unix(int64(files[0].GetModifiedTime()), 0), nil
}
func (f *tierTimestampTestBackendFile) Name() string {
return f.path
}
func (f *tierTimestampTestBackendFile) Sync() error {
return nil
}
func TestVolumeTierMoveDatPreservesModifiedTime(t *testing.T) {
dataDir := t.TempDir()
remoteDir := t.TempDir()
testBackend := &tierTimestampTestBackend{root: remoteDir}
backend.BackendStorages[tierTimestampTestBackendName] = testBackend
t.Cleanup(func() {
delete(backend.BackendStorages, tierTimestampTestBackendName)
})
store := storage.NewStore(
nil,
"localhost",
8080,
18080,
"http://localhost:8080",
"store-id",
[]string{dataDir},
[]int32{10},
[]util.MinFreeSpace{{}},
"",
storage.NeedleMapInMemory,
[]types.DiskType{types.HardDriveType},
nil,
0,
stats.DefaultDiskIOProbeConfig(),
)
t.Cleanup(store.Close)
const volumeId = needle.VolumeId(1)
if err := store.AddVolume(volumeId, "", storage.NeedleMapInMemory, "000", "", 0, needle.Version3, 0, types.HardDriveType, 0); err != nil {
t.Fatalf("add volume: %v", err)
}
volume := store.GetVolume(volumeId)
dataFileName := volume.FileName(".dat")
sourceModifiedTime := time.Unix(1_700_000_000, 0)
if err := os.Chtimes(dataFileName, sourceModifiedTime, sourceModifiedTime); err != nil {
t.Fatalf("set source modified time: %v", err)
}
volumeServer := &VolumeServer{store: store}
if err := volumeServer.VolumeTierMoveDatToRemote(
&volume_server_pb.VolumeTierMoveDatToRemoteRequest{
VolumeId: uint32(volumeId),
DestinationBackendName: tierTimestampTestBackendName,
},
&discardServerStream[volume_server_pb.VolumeTierMoveDatToRemoteResponse]{},
); err != nil {
t.Fatalf("move data to remote: %v", err)
}
remoteFiles := volume.GetVolumeInfo().GetFiles()
if len(remoteFiles) != 1 {
t.Fatalf("remote file count = %d, want 1", len(remoteFiles))
}
if got := remoteFiles[0].GetModifiedTime(); got != uint64(sourceModifiedTime.Unix()) {
t.Fatalf("remote modified time = %d, want %d", got, sourceModifiedTime.Unix())
}
if _, err := os.Stat(dataFileName); !os.IsNotExist(err) {
t.Fatalf("local data file still exists after upload: %v", err)
}
if err := volumeServer.VolumeTierMoveDatFromRemote(
&volume_server_pb.VolumeTierMoveDatFromRemoteRequest{
VolumeId: uint32(volumeId),
},
&discardServerStream[volume_server_pb.VolumeTierMoveDatFromRemoteResponse]{},
); err != nil {
t.Fatalf("move data from remote: %v", err)
}
fileInfo, err := os.Stat(dataFileName)
if err != nil {
t.Fatalf("stat downloaded data file: %v", err)
}
if got := fileInfo.ModTime().Unix(); got != sourceModifiedTime.Unix() {
t.Fatalf("downloaded modified time = %d, want %d", got, sourceModifiedTime.Unix())
}
}
+5 -1
View File
@@ -32,6 +32,10 @@ func (vs *VolumeServer) VolumeTierMoveDatToRemote(req *volume_server_pb.VolumeTi
if !ok {
return nil // already copied to remove. fmt.Errorf("volume %d is not on local disk", req.VolumeId)
}
fileInfo, err := diskFile.File.Stat()
if err != nil {
return fmt.Errorf("stat data file %s: %v", diskFile.Name(), err)
}
// check valid storage backend type
backendStorage, found := backend.BackendStorages[req.DestinationBackendName]
@@ -78,7 +82,7 @@ func (vs *VolumeServer) VolumeTierMoveDatToRemote(req *volume_server_pb.VolumeTi
Key: key,
Offset: 0,
FileSize: uint64(size),
ModifiedTime: uint64(time.Now().Unix()),
ModifiedTime: uint64(fileInfo.ModTime().Unix()),
Extension: ".dat",
})