mirror of
https://github.com/seaweedfs/seaweedfs.git
synced 2024-01-19 02:48:24 +00:00
arangodb s3 bucket name compatibility (#3588)
* Update arangodb_store.go * update readme, properly escape queries, add name patching * use underscore * use underscore * better comment * fix readme Co-authored-by: a <a@a.a>
This commit is contained in:
parent
10d545060f
commit
48db56ddad
|
@ -66,8 +66,8 @@ func (store *ArangodbStore) Initialize(configuration util.Configuration, prefix
|
||||||
}
|
}
|
||||||
|
|
||||||
func (store *ArangodbStore) connection(uris []string, user string, pass string, insecure bool) (err error) {
|
func (store *ArangodbStore) connection(uris []string, user string, pass string, insecure bool) (err error) {
|
||||||
ctx, _ := context.WithTimeout(context.Background(), 10*time.Second)
|
ctx, cn := context.WithTimeout(context.Background(), 10*time.Second)
|
||||||
|
defer cn()
|
||||||
store.connect, err = http.NewConnection(http.ConnectionConfig{
|
store.connect, err = http.NewConnection(http.ConnectionConfig{
|
||||||
Endpoints: uris,
|
Endpoints: uris,
|
||||||
TLSConfig: &tls.Config{
|
TLSConfig: &tls.Config{
|
||||||
|
@ -274,10 +274,10 @@ func (store *ArangodbStore) DeleteFolderChildren(ctx context.Context, fullpath u
|
||||||
for d in %s
|
for d in %s
|
||||||
filter starts_with(d.directory, "%s/") || d.directory == "%s"
|
filter starts_with(d.directory, "%s/") || d.directory == "%s"
|
||||||
remove d._key in %s`,
|
remove d._key in %s`,
|
||||||
targetCollection.Name(),
|
"`"+targetCollection.Name()+"`",
|
||||||
strings.Join(strings.Split(string(fullpath), "/"), ","),
|
strings.Join(strings.Split(string(fullpath), "/"), ","),
|
||||||
string(fullpath),
|
string(fullpath),
|
||||||
targetCollection.Name(),
|
"`"+targetCollection.Name()+"`",
|
||||||
)
|
)
|
||||||
cur, err := store.database.Query(ctx, query, nil)
|
cur, err := store.database.Query(ctx, query, nil)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
|
@ -296,7 +296,7 @@ func (store *ArangodbStore) ListDirectoryPrefixedEntries(ctx context.Context, di
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return lastFileName, err
|
return lastFileName, err
|
||||||
}
|
}
|
||||||
query := "for d in " + targetCollection.Name()
|
query := "for d in " + "`" + targetCollection.Name() + "`"
|
||||||
if includeStartFile {
|
if includeStartFile {
|
||||||
query = query + " filter d.name >= \"" + startFileName + "\" "
|
query = query + " filter d.name >= \"" + startFileName + "\" "
|
||||||
} else {
|
} else {
|
||||||
|
|
|
@ -98,8 +98,26 @@ func (store *ArangodbStore) ensureBucket(ctx context.Context, bucket string) (bc
|
||||||
return store.buckets[bucket], nil
|
return store.buckets[bucket], nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// transform to an arango compliant name
|
||||||
|
func bucketToCollectionName(s string) string {
|
||||||
|
if len(s) == 0 {
|
||||||
|
return ""
|
||||||
|
}
|
||||||
|
// replace all "." with _
|
||||||
|
s = strings.ReplaceAll(s, ".", "_")
|
||||||
|
|
||||||
|
// if starts with number or '.' then add a special prefix
|
||||||
|
if (s[0] >= '0' && s[0] <= '9') || (s[0] == '.' || s[0] == '_' || s[0] == '-') {
|
||||||
|
s = "xN--" + s
|
||||||
|
}
|
||||||
|
return s
|
||||||
|
}
|
||||||
|
|
||||||
// creates collection if not exist, ensures indices if not exist
|
// creates collection if not exist, ensures indices if not exist
|
||||||
func (store *ArangodbStore) ensureCollection(ctx context.Context, name string) (c driver.Collection, err error) {
|
func (store *ArangodbStore) ensureCollection(ctx context.Context, bucket_name string) (c driver.Collection, err error) {
|
||||||
|
// convert the bucket to collection name
|
||||||
|
name := bucketToCollectionName(bucket_name)
|
||||||
|
|
||||||
ok, err := store.database.CollectionExists(ctx, name)
|
ok, err := store.database.CollectionExists(ctx, name)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return
|
return
|
||||||
|
|
|
@ -22,6 +22,39 @@ i test using this dev database:
|
||||||
`docker run -p 8529:8529 -e ARANGO_ROOT_PASSWORD=test arangodb/arangodb:3.9.0`
|
`docker run -p 8529:8529 -e ARANGO_ROOT_PASSWORD=test arangodb/arangodb:3.9.0`
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
## database structure
|
||||||
|
|
||||||
|
|
||||||
|
arangodb has a few restrictions which require the use of a few tricks in order to losslessly store the data.
|
||||||
|
|
||||||
|
### filer store
|
||||||
|
|
||||||
|
arangodb does not support []byte, and will store such as a uint64 array. this would be a waste of space. to counteract this, we store the data as a length prefixed uint64 byteset.
|
||||||
|
|
||||||
|
### filer kv
|
||||||
|
|
||||||
|
same as above
|
||||||
|
|
||||||
|
### filer buckets
|
||||||
|
|
||||||
|
s3 buckets are implemented through arangodb collection. this allows us to do very fast bucket deletion by simply deleting the collection
|
||||||
|
|
||||||
|
|
||||||
|
arangodb collection name rules is character set `azAZ09_-` with a 256 character max. however the first character must be a letter.
|
||||||
|
|
||||||
|
|
||||||
|
s3 bucket name rule is the set `azAZ09.-` with a 63 characters max.
|
||||||
|
|
||||||
|
the rules for collection names is then the following:
|
||||||
|
|
||||||
|
1. if the bucket name is a valid arangodb collection name, then nothing is done.
|
||||||
|
2. if the bucket name contains a ".", the "." is replaced with "_"
|
||||||
|
3. if the bucket name now begins with a number or "_", the prefix "xN--" is prepended to the collection name
|
||||||
|
|
||||||
|
this allows for these collection names to be used.
|
||||||
|
|
||||||
|
|
||||||
## features i don't personally need but are missing
|
## features i don't personally need but are missing
|
||||||
[ ] provide tls cert to arango
|
[ ] provide tls cert to arango
|
||||||
[ ] authentication that is not basic auth
|
[ ] authentication that is not basic auth
|
||||||
|
|
Loading…
Reference in a new issue