2018-10-04 06:36:52 +00:00
|
|
|
package S3Sink
|
|
|
|
|
|
|
|
import (
|
2019-03-16 00:20:24 +00:00
|
|
|
"context"
|
2018-10-04 06:36:52 +00:00
|
|
|
"fmt"
|
2018-11-04 19:58:59 +00:00
|
|
|
"strings"
|
2018-10-06 20:04:33 +00:00
|
|
|
"sync"
|
2018-10-04 06:36:52 +00:00
|
|
|
|
2018-10-11 07:08:13 +00:00
|
|
|
"github.com/aws/aws-sdk-go/aws"
|
|
|
|
"github.com/aws/aws-sdk-go/aws/credentials"
|
2018-10-04 06:36:52 +00:00
|
|
|
"github.com/aws/aws-sdk-go/aws/session"
|
2018-10-11 07:08:13 +00:00
|
|
|
"github.com/aws/aws-sdk-go/service/s3"
|
|
|
|
"github.com/aws/aws-sdk-go/service/s3/s3iface"
|
2020-02-26 05:50:12 +00:00
|
|
|
|
2020-09-01 07:21:19 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/filer"
|
2018-11-01 08:12:21 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
2018-10-11 07:08:13 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb/filer_pb"
|
2018-10-04 06:36:52 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/replication/sink"
|
2018-10-11 07:08:13 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/replication/source"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/util"
|
2018-10-04 06:36:52 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
type S3Sink struct {
|
2021-03-01 00:19:03 +00:00
|
|
|
conn s3iface.S3API
|
|
|
|
region string
|
|
|
|
bucket string
|
|
|
|
dir string
|
|
|
|
endpoint string
|
|
|
|
filerSource *source.FilerSource
|
|
|
|
isIncremental bool
|
2018-10-04 06:36:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func init() {
|
|
|
|
sink.Sinks = append(sink.Sinks, &S3Sink{})
|
|
|
|
}
|
|
|
|
|
|
|
|
func (s3sink *S3Sink) GetName() string {
|
2018-10-07 00:10:15 +00:00
|
|
|
return "s3"
|
2018-10-04 06:36:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func (s3sink *S3Sink) GetSinkToDirectory() string {
|
|
|
|
return s3sink.dir
|
|
|
|
}
|
|
|
|
|
2021-03-01 00:19:03 +00:00
|
|
|
func (s3sink *S3Sink) IsIncremental() bool {
|
|
|
|
return s3sink.isIncremental
|
|
|
|
}
|
|
|
|
|
2020-01-29 17:09:55 +00:00
|
|
|
func (s3sink *S3Sink) Initialize(configuration util.Configuration, prefix string) error {
|
|
|
|
glog.V(0).Infof("sink.s3.region: %v", configuration.GetString(prefix+"region"))
|
|
|
|
glog.V(0).Infof("sink.s3.bucket: %v", configuration.GetString(prefix+"bucket"))
|
|
|
|
glog.V(0).Infof("sink.s3.directory: %v", configuration.GetString(prefix+"directory"))
|
2020-04-08 00:49:00 +00:00
|
|
|
glog.V(0).Infof("sink.s3.endpoint: %v", configuration.GetString(prefix+"endpoint"))
|
2021-03-01 00:19:03 +00:00
|
|
|
glog.V(0).Infof("sink.s3.is_incremental: %v", configuration.GetString(prefix+"is_incremental"))
|
|
|
|
s3sink.isIncremental = configuration.GetBool(prefix + "is_incremental")
|
2018-10-04 06:36:52 +00:00
|
|
|
return s3sink.initialize(
|
2020-01-29 17:09:55 +00:00
|
|
|
configuration.GetString(prefix+"aws_access_key_id"),
|
|
|
|
configuration.GetString(prefix+"aws_secret_access_key"),
|
|
|
|
configuration.GetString(prefix+"region"),
|
|
|
|
configuration.GetString(prefix+"bucket"),
|
|
|
|
configuration.GetString(prefix+"directory"),
|
2020-04-08 00:49:00 +00:00
|
|
|
configuration.GetString(prefix+"endpoint"),
|
2018-10-04 06:36:52 +00:00
|
|
|
)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (s3sink *S3Sink) SetSourceFiler(s *source.FilerSource) {
|
|
|
|
s3sink.filerSource = s
|
|
|
|
}
|
|
|
|
|
2020-04-08 00:49:00 +00:00
|
|
|
func (s3sink *S3Sink) initialize(awsAccessKeyId, awsSecretAccessKey, region, bucket, dir, endpoint string) error {
|
2018-10-04 06:36:52 +00:00
|
|
|
s3sink.region = region
|
|
|
|
s3sink.bucket = bucket
|
|
|
|
s3sink.dir = dir
|
2020-04-08 00:49:00 +00:00
|
|
|
s3sink.endpoint = endpoint
|
2018-10-04 06:36:52 +00:00
|
|
|
|
|
|
|
config := &aws.Config{
|
2021-03-01 00:19:03 +00:00
|
|
|
Region: aws.String(s3sink.region),
|
|
|
|
Endpoint: aws.String(s3sink.endpoint),
|
2021-03-01 00:20:13 +00:00
|
|
|
S3ForcePathStyle: aws.Bool(true),
|
2018-10-04 06:36:52 +00:00
|
|
|
}
|
2019-11-19 03:24:34 +00:00
|
|
|
if awsAccessKeyId != "" && awsSecretAccessKey != "" {
|
|
|
|
config.Credentials = credentials.NewStaticCredentials(awsAccessKeyId, awsSecretAccessKey, "")
|
2018-10-04 06:36:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
sess, err := session.NewSession(config)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("create aws session: %v", err)
|
|
|
|
}
|
|
|
|
s3sink.conn = s3.New(sess)
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-09-09 18:21:23 +00:00
|
|
|
func (s3sink *S3Sink) DeleteEntry(key string, isDirectory, deleteIncludeChunks bool, signatures []int32) error {
|
2018-10-04 06:36:52 +00:00
|
|
|
|
2018-11-04 19:58:59 +00:00
|
|
|
key = cleanKey(key)
|
|
|
|
|
2018-10-04 06:36:52 +00:00
|
|
|
if isDirectory {
|
|
|
|
key = key + "/"
|
|
|
|
}
|
|
|
|
|
|
|
|
return s3sink.deleteObject(key)
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2020-09-09 18:21:23 +00:00
|
|
|
func (s3sink *S3Sink) CreateEntry(key string, entry *filer_pb.Entry, signatures []int32) error {
|
2018-11-04 19:58:59 +00:00
|
|
|
key = cleanKey(key)
|
|
|
|
|
2018-10-04 08:14:44 +00:00
|
|
|
if entry.IsDirectory {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2018-10-04 06:36:52 +00:00
|
|
|
uploadId, err := s3sink.createMultipartUpload(key, entry)
|
|
|
|
if err != nil {
|
2021-03-01 00:19:03 +00:00
|
|
|
return fmt.Errorf("createMultipartUpload: %v", err)
|
2018-10-04 06:36:52 +00:00
|
|
|
}
|
|
|
|
|
2020-09-01 07:21:19 +00:00
|
|
|
totalSize := filer.FileSize(entry)
|
|
|
|
chunkViews := filer.ViewFromChunks(s3sink.filerSource.LookupFileId, entry.Chunks, 0, int64(totalSize))
|
2018-10-04 06:36:52 +00:00
|
|
|
|
2020-03-11 06:37:14 +00:00
|
|
|
parts := make([]*s3.CompletedPart, len(chunkViews))
|
|
|
|
|
2018-10-04 06:36:52 +00:00
|
|
|
var wg sync.WaitGroup
|
|
|
|
for chunkIndex, chunk := range chunkViews {
|
|
|
|
partId := chunkIndex + 1
|
|
|
|
wg.Add(1)
|
2020-09-01 07:21:19 +00:00
|
|
|
go func(chunk *filer.ChunkView, index int) {
|
2018-10-04 06:36:52 +00:00
|
|
|
defer wg.Done()
|
2020-02-26 06:23:59 +00:00
|
|
|
if part, uploadErr := s3sink.uploadPart(key, uploadId, partId, chunk); uploadErr != nil {
|
2018-10-04 06:36:52 +00:00
|
|
|
err = uploadErr
|
2021-03-01 00:19:03 +00:00
|
|
|
glog.Errorf("uploadPart: %v", uploadErr)
|
2018-10-04 06:36:52 +00:00
|
|
|
} else {
|
2020-03-11 06:37:14 +00:00
|
|
|
parts[index] = part
|
2018-10-04 06:36:52 +00:00
|
|
|
}
|
2020-03-11 06:37:14 +00:00
|
|
|
}(chunk, chunkIndex)
|
2018-10-04 06:36:52 +00:00
|
|
|
}
|
|
|
|
wg.Wait()
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
s3sink.abortMultipartUpload(key, uploadId)
|
2021-03-01 00:19:03 +00:00
|
|
|
return fmt.Errorf("uploadPart: %v", err)
|
2018-10-04 06:36:52 +00:00
|
|
|
}
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
return s3sink.completeMultipartUpload(context.Background(), key, uploadId, parts)
|
2018-10-04 06:36:52 +00:00
|
|
|
|
|
|
|
}
|
|
|
|
|
2020-09-09 18:21:23 +00:00
|
|
|
func (s3sink *S3Sink) UpdateEntry(key string, oldEntry *filer_pb.Entry, newParentPath string, newEntry *filer_pb.Entry, deleteIncludeChunks bool, signatures []int32) (foundExistingEntry bool, err error) {
|
2018-11-04 19:58:59 +00:00
|
|
|
key = cleanKey(key)
|
2018-10-04 06:36:52 +00:00
|
|
|
// TODO improve efficiency
|
|
|
|
return false, nil
|
|
|
|
}
|
2018-11-04 19:58:59 +00:00
|
|
|
|
|
|
|
// cleanKey strips a single leading "/" from key, if present, and returns the
// result. Keys without a leading slash are returned unchanged.
func cleanKey(key string) string {
	return strings.TrimPrefix(key, "/")
}
|