mirror of
https://github.com/seaweedfs/seaweedfs.git
synced 2024-01-19 02:48:24 +00:00
Merge pull request #375 from hxiaodon/master
supplemental data between compacting and commit compacting
This commit is contained in:
commit
79fdea0de4
|
@ -23,6 +23,9 @@ type Volume struct {
|
||||||
|
|
||||||
dataFileAccessLock sync.Mutex
|
dataFileAccessLock sync.Mutex
|
||||||
lastModifiedTime uint64 //unix time in seconds
|
lastModifiedTime uint64 //unix time in seconds
|
||||||
|
|
||||||
|
lastCompactIndexOffset uint64
|
||||||
|
lastCompactRevision uint16
|
||||||
}
|
}
|
||||||
|
|
||||||
func NewVolume(dirname string, collection string, id VolumeId, needleMapKind NeedleMapType, replicaPlacement *ReplicaPlacement, ttl *TTL) (v *Volume, e error) {
|
func NewVolume(dirname string, collection string, id VolumeId, needleMapKind NeedleMapType, replicaPlacement *ReplicaPlacement, ttl *TTL) (v *Volume, e error) {
|
||||||
|
|
|
@ -21,7 +21,6 @@ func CheckVolumeDataIntegrity(v *Volume, indexFile *os.File) error {
|
||||||
return fmt.Errorf("readLastIndexEntry %s failed: %v", indexFile.Name(), e)
|
return fmt.Errorf("readLastIndexEntry %s failed: %v", indexFile.Name(), e)
|
||||||
}
|
}
|
||||||
key, offset, size := idxFileEntry(lastIdxEntry)
|
key, offset, size := idxFileEntry(lastIdxEntry)
|
||||||
//deleted index entry could not point to deleted needle
|
|
||||||
if offset == 0 {
|
if offset == 0 {
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
|
@ -6,6 +6,7 @@ import (
|
||||||
"time"
|
"time"
|
||||||
|
|
||||||
"github.com/chrislusf/seaweedfs/weed/glog"
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
||||||
|
"github.com/chrislusf/seaweedfs/weed/util"
|
||||||
)
|
)
|
||||||
|
|
||||||
func (v *Volume) garbageLevel() float64 {
|
func (v *Volume) garbageLevel() float64 {
|
||||||
|
@ -20,7 +21,9 @@ func (v *Volume) Compact() error {
|
||||||
//glog.V(3).Infof("Got Compaction lock...")
|
//glog.V(3).Infof("Got Compaction lock...")
|
||||||
|
|
||||||
filePath := v.FileName()
|
filePath := v.FileName()
|
||||||
glog.V(3).Infof("creating copies for volume %d ...", v.Id)
|
v.lastCompactIndexOffset = v.nm.IndexFileSize()
|
||||||
|
v.lastCompactRevision = v.SuperBlock.CompactRevision
|
||||||
|
glog.V(3).Infof("creating copies for volume %d ,last offset %d...", v.Id, v.lastCompactIndexOffset)
|
||||||
return v.copyDataAndGenerateIndexFile(filePath+".cpd", filePath+".cpx")
|
return v.copyDataAndGenerateIndexFile(filePath+".cpd", filePath+".cpx")
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -38,14 +41,28 @@ func (v *Volume) commitCompact() error {
|
||||||
glog.V(3).Infof("Got Committing lock...")
|
glog.V(3).Infof("Got Committing lock...")
|
||||||
v.nm.Close()
|
v.nm.Close()
|
||||||
_ = v.dataFile.Close()
|
_ = v.dataFile.Close()
|
||||||
makeupDiff(v.FileName()+".cpd", v.FileName()+".cpx", v.FileName()+".dat", v.FileName()+".idx")
|
|
||||||
var e error
|
var e error
|
||||||
if e = os.Rename(v.FileName()+".cpd", v.FileName()+".dat"); e != nil {
|
if e = v.makeupDiff(v.FileName()+".cpd", v.FileName()+".cpx", v.FileName()+".dat", v.FileName()+".idx"); e != nil {
|
||||||
return e
|
glog.V(0).Infof("makeupDiff in commitCompact failed %v", e)
|
||||||
}
|
e = os.Remove(v.FileName() + ".cpd")
|
||||||
if e = os.Rename(v.FileName()+".cpx", v.FileName()+".idx"); e != nil {
|
if e != nil {
|
||||||
return e
|
return e
|
||||||
|
}
|
||||||
|
e = os.Remove(v.FileName() + ".cpx")
|
||||||
|
if e != nil {
|
||||||
|
return e
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
var e error
|
||||||
|
if e = os.Rename(v.FileName()+".cpd", v.FileName()+".dat"); e != nil {
|
||||||
|
return e
|
||||||
|
}
|
||||||
|
if e = os.Rename(v.FileName()+".cpx", v.FileName()+".idx"); e != nil {
|
||||||
|
return e
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
//glog.V(3).Infof("Pretending to be vacuuming...")
|
//glog.V(3).Infof("Pretending to be vacuuming...")
|
||||||
//time.Sleep(20 * time.Second)
|
//time.Sleep(20 * time.Second)
|
||||||
glog.V(3).Infof("Loading Commit file...")
|
glog.V(3).Infof("Loading Commit file...")
|
||||||
|
@ -55,7 +72,138 @@ func (v *Volume) commitCompact() error {
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
func makeupDiff(newDatFile, newIdxFile, oldDatFile, oldIdxFile string) (err error) {
|
func fetchCompactRevisionFromDatFile(file *os.File) (compactRevision uint16, err error) {
|
||||||
|
if _, err = file.Seek(0, 0); err != nil {
|
||||||
|
return 0, fmt.Errorf("cannot seek to the beginning of %s: %v", file.Name(), err)
|
||||||
|
}
|
||||||
|
header := make([]byte, SuperBlockSize)
|
||||||
|
if _, e := file.Read(header); e != nil {
|
||||||
|
return 0, fmt.Errorf("cannot read file %s 's super block: %v", file.Name(), e)
|
||||||
|
}
|
||||||
|
superBlock, err := ParseSuperBlock(header)
|
||||||
|
if err != nil {
|
||||||
|
return 0, err
|
||||||
|
}
|
||||||
|
return superBlock.CompactRevision, nil
|
||||||
|
}
|
||||||
|
|
||||||
|
func (v *Volume) makeupDiff(newDatFileName, newIdxFileName, oldDatFileName, oldIdxFileName string) (err error) {
|
||||||
|
var indexSize int64
|
||||||
|
|
||||||
|
oldIdxFile, err := os.Open(oldIdxFileName)
|
||||||
|
defer oldIdxFile.Close()
|
||||||
|
|
||||||
|
oldDatFile, err := os.Open(oldDatFileName)
|
||||||
|
defer oldDatFile.Close()
|
||||||
|
|
||||||
|
if indexSize, err = verifyIndexFileIntegrity(oldIdxFile); err != nil {
|
||||||
|
return fmt.Errorf("verifyIndexFileIntegrity %s failed: %v", oldIdxFileName, err)
|
||||||
|
}
|
||||||
|
if indexSize == 0 || uint64(indexSize) <= v.lastCompactIndexOffset {
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
oldDatCompactRevision, err := fetchCompactRevisionFromDatFile(oldDatFile)
|
||||||
|
if err != nil {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
if oldDatCompactRevision != v.lastCompactRevision {
|
||||||
|
return fmt.Errorf("current old dat file's compact revision %d is not the expected one %d", oldDatCompactRevision, v.lastCompactRevision)
|
||||||
|
}
|
||||||
|
|
||||||
|
type keyField struct {
|
||||||
|
offset uint32
|
||||||
|
size uint32
|
||||||
|
}
|
||||||
|
incrementedHasUpdatedIndexEntry := make(map[uint64]keyField)
|
||||||
|
|
||||||
|
for idx_offset := indexSize - NeedleIndexSize; uint64(idx_offset) >= v.lastCompactIndexOffset; idx_offset -= NeedleIndexSize {
|
||||||
|
var IdxEntry []byte
|
||||||
|
if IdxEntry, err = readIndexEntryAtOffset(oldIdxFile, idx_offset); err != nil {
|
||||||
|
return fmt.Errorf("readIndexEntry %s at offset %d failed: %v", oldIdxFileName, idx_offset, err)
|
||||||
|
}
|
||||||
|
key, offset, size := idxFileEntry(IdxEntry)
|
||||||
|
if _, found := incrementedHasUpdatedIndexEntry[key]; !found {
|
||||||
|
incrementedHasUpdatedIndexEntry[key] = keyField{
|
||||||
|
offset: offset,
|
||||||
|
size: size,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if len(incrementedHasUpdatedIndexEntry) > 0 {
|
||||||
|
var (
|
||||||
|
dst, idx *os.File
|
||||||
|
)
|
||||||
|
if dst, err = os.OpenFile(newDatFileName, os.O_RDWR, 0644); err != nil {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
defer dst.Close()
|
||||||
|
|
||||||
|
if idx, err = os.OpenFile(newIdxFileName, os.O_RDWR, 0644); err != nil {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
defer idx.Close()
|
||||||
|
|
||||||
|
var newDatCompactRevision uint16
|
||||||
|
newDatCompactRevision, err = fetchCompactRevisionFromDatFile(dst)
|
||||||
|
if err != nil {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
if oldDatCompactRevision+1 != newDatCompactRevision {
|
||||||
|
return fmt.Errorf("oldDatFile %s 's compact revision is %d while newDatFile %s 's compact revision is %d", oldDatFileName, oldDatCompactRevision, newDatFileName, newDatCompactRevision)
|
||||||
|
}
|
||||||
|
|
||||||
|
idx_entry_bytes := make([]byte, 16)
|
||||||
|
for key, incre_idx_entry := range incrementedHasUpdatedIndexEntry {
|
||||||
|
util.Uint64toBytes(idx_entry_bytes[0:8], key)
|
||||||
|
util.Uint32toBytes(idx_entry_bytes[8:12], incre_idx_entry.offset)
|
||||||
|
util.Uint32toBytes(idx_entry_bytes[12:16], incre_idx_entry.size)
|
||||||
|
|
||||||
|
var offset int64
|
||||||
|
if offset, err = dst.Seek(0, 2); err != nil {
|
||||||
|
glog.V(0).Infof("failed to seek the end of file: %v", err)
|
||||||
|
return
|
||||||
|
}
|
||||||
|
//ensure file writing starting from aligned positions
|
||||||
|
if offset%NeedlePaddingSize != 0 {
|
||||||
|
offset = offset + (NeedlePaddingSize - offset%NeedlePaddingSize)
|
||||||
|
if offset, err = v.dataFile.Seek(offset, 0); err != nil {
|
||||||
|
glog.V(0).Infof("failed to align in datafile %s: %v", v.dataFile.Name(), err)
|
||||||
|
return
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
//updated needle
|
||||||
|
if incre_idx_entry.offset != 0 && incre_idx_entry.size != 0 {
|
||||||
|
//even the needle cache in memory is hit, the need_bytes is correct
|
||||||
|
var needle_bytes []byte
|
||||||
|
needle_bytes, _, err = ReadNeedleBlob(oldDatFile, int64(incre_idx_entry.offset)*NeedlePaddingSize, incre_idx_entry.size)
|
||||||
|
if err != nil {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
dst.Write(needle_bytes)
|
||||||
|
util.Uint32toBytes(idx_entry_bytes[8:12], uint32(offset/NeedlePaddingSize))
|
||||||
|
} else { //deleted needle
|
||||||
|
//fakeDelNeedle 's default Data field is nil
|
||||||
|
fakeDelNeedle := new(Needle)
|
||||||
|
fakeDelNeedle.Id = key
|
||||||
|
fakeDelNeedle.Cookie = 0x12345678
|
||||||
|
_, err = fakeDelNeedle.Append(dst, v.Version())
|
||||||
|
if err != nil {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
util.Uint32toBytes(idx_entry_bytes[8:12], uint32(0))
|
||||||
|
}
|
||||||
|
|
||||||
|
if _, err := idx.Seek(0, 2); err != nil {
|
||||||
|
return fmt.Errorf("cannot seek end of indexfile %s: %v",
|
||||||
|
newIdxFileName, err)
|
||||||
|
}
|
||||||
|
_, err = idx.Write(idx_entry_bytes)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
55
weed/storage/volume_vacuum_test.go
Normal file
55
weed/storage/volume_vacuum_test.go
Normal file
|
@ -0,0 +1,55 @@
|
||||||
|
package storage
|
||||||
|
|
||||||
|
import (
|
||||||
|
"testing"
|
||||||
|
)
|
||||||
|
|
||||||
|
/*
|
||||||
|
makediff test steps
|
||||||
|
1. launch weed server at your local/dev environment, (option
|
||||||
|
"garbageThreshold" for master and option "max" for volume should be set with specific value which would let
|
||||||
|
preparing test prerequisite easier )
|
||||||
|
a) ./weed master -garbageThreshold=0.99 -mdir=./m
|
||||||
|
b) ./weed volume -dir=./data -max=1 -mserver=localhost:9333 -port=8080
|
||||||
|
2. upload 4 different files, you could call dir/assign to get 4 different fids
|
||||||
|
a) upload file A with fid a
|
||||||
|
b) upload file B with fid b
|
||||||
|
c) upload file C with fid c
|
||||||
|
d) upload file D with fid d
|
||||||
|
3. update file A and C
|
||||||
|
a) modify file A and upload file A with fid a
|
||||||
|
b) modify file C and upload file C with fid c
|
||||||
|
c) record the current 1.idx's file size(lastCompactIndexOffset value)
|
||||||
|
4. Compacting the data file
|
||||||
|
a) run curl http://localhost:8080/admin/vacuum/compact?volumeId=1
|
||||||
|
b) verify the 1.cpd and 1.cpx is created under volume directory
|
||||||
|
5. update file B and delete file D
|
||||||
|
a) modify file B and upload file B with fid b
|
||||||
|
d) delete file B with fid b
|
||||||
|
6. Now you could run the following UT case, the case should be run successfully
|
||||||
|
7. Compact commit manually
|
||||||
|
a) mv 1.cpd 1.dat
|
||||||
|
b) mv 1.cpx 1.idx
|
||||||
|
8. Restart Volume Server
|
||||||
|
9. Now you should get updated file A,B,C
|
||||||
|
*/
|
||||||
|
|
||||||
|
func TestMakeDiff(t *testing.T) {
|
||||||
|
|
||||||
|
v := new(Volume)
|
||||||
|
//lastCompactIndexOffset value is the index file size before step 4
|
||||||
|
v.lastCompactIndexOffset = 96
|
||||||
|
v.SuperBlock.version = 0x2
|
||||||
|
/*
|
||||||
|
err := v.makeupDiff(
|
||||||
|
"/yourpath/1.cpd",
|
||||||
|
"/yourpath/1.cpx",
|
||||||
|
"/yourpath/1.dat",
|
||||||
|
"/yourpath/1.idx")
|
||||||
|
if err != nil {
|
||||||
|
t.Errorf("makeupDiff err is %v", err)
|
||||||
|
} else {
|
||||||
|
t.Log("makeupDiff Succeeded")
|
||||||
|
}
|
||||||
|
*/
|
||||||
|
}
|
Loading…
Reference in a new issue