Skip to content

Commit

Permalink
s3: export PartSize parameter
Browse files Browse the repository at this point in the history
By default AWS SDK use part_size of 5 MB. For big files,
it is not ideal case. For Hadoop, it is not uncommon to
use 512 MB.
  • Loading branch information
murlock authored and drakkan committed Mar 13, 2020
1 parent 6b70f0b commit cdf1233
Show file tree
Hide file tree
Showing 5 changed files with 27 additions and 1 deletion.
2 changes: 2 additions & 0 deletions httpd/httpd_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -2010,6 +2010,7 @@ func TestWebUserS3Mock(t *testing.T) {
user.FsConfig.S3Config.Endpoint = "http://127.0.0.1:9000/path?a=b"
user.FsConfig.S3Config.StorageClass = "Standard"
user.FsConfig.S3Config.KeyPrefix = "somedir/subdir/"
user.FsConfig.S3Config.PartSize = 5
form := make(url.Values)
form.Set("username", user.Username)
form.Set("home_dir", user.HomeDir)
Expand All @@ -2034,6 +2035,7 @@ func TestWebUserS3Mock(t *testing.T) {
form.Set("s3_storage_class", user.FsConfig.S3Config.StorageClass)
form.Set("s3_endpoint", user.FsConfig.S3Config.Endpoint)
form.Set("s3_key_prefix", user.FsConfig.S3Config.KeyPrefix)
form.Set("s3_part_size", strconv.FormatInt(int64(user.FsConfig.S3Config.PartSize), 10))
form.Set("allowed_extensions", "/dir1::.jpg,.png")
form.Set("denied_extensions", "/dir2::.zip")
b, contentType, _ := getMultipartFormData(form, "", "")
Expand Down
4 changes: 4 additions & 0 deletions httpd/web.go
Original file line number Diff line number Diff line change
Expand Up @@ -329,6 +329,10 @@ func getFsConfigFromUserPostFields(r *http.Request) (dataprovider.Filesystem, er
fs.S3Config.Endpoint = r.Form.Get("s3_endpoint")
fs.S3Config.StorageClass = r.Form.Get("s3_storage_class")
fs.S3Config.KeyPrefix = r.Form.Get("s3_key_prefix")
fs.S3Config.PartSize, err = strconv.ParseInt(r.Form.Get("s3_part_size"), 10, 64)
if err != nil {
return fs, err
}
} else if fs.Provider == 2 {
fs.GCSConfig.Bucket = r.Form.Get("gcs_bucket")
fs.GCSConfig.StorageClass = r.Form.Get("gcs_storage_class")
Expand Down
11 changes: 10 additions & 1 deletion templates/user.html
Original file line number Diff line number Diff line change
Expand Up @@ -300,6 +300,15 @@ <h1 class="h5 mb-4 text-gray-800">{{if .IsAdd}}Add a new user{{else}}Edit user{{
</div>
</div>

<div class="form-group row s3">
<label for="idS3PartSize" class="col-sm-2 col-form-label">Part Size (MB)</label>
<div class="col-sm-3">
<input type="number" class="form-control" id="idS3PartSoze" name="s3_part_size" placeholder=""
value="{{.User.FsConfig.S3Config.PartSize}}" min="5">
</div>
<div class="col-sm-2"></div>
</div>

<div class="form-group row s3">
<label for="idS3KeyPrefix" class="col-sm-2 col-form-label">Key Prefix</label>
<div class="col-sm-10">
Expand Down Expand Up @@ -418,4 +427,4 @@ <h1 class="h5 mb-4 text-gray-800">{{if .IsAdd}}Add a new user{{else}}Edit user{{
}
}
</script>
{{end}}
{{end}}
8 changes: 8 additions & 0 deletions vfs/s3fs.go
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,7 @@ type S3FsConfig struct {
AccessSecret string `json:"access_secret,omitempty"`
Endpoint string `json:"endpoint,omitempty"`
StorageClass string `json:"storage_class,omitempty"`
PartSize int64 `json:"partsize,omitempty"`
}

// S3Fs is a Fs implementation for Amazon S3 compatible object storage.
Expand Down Expand Up @@ -81,6 +82,12 @@ func NewS3Fs(connectionID, localTempDir string, config S3FsConfig) (Fs, error) {
awsConfig.S3ForcePathStyle = aws.Bool(true)
}

if fs.config.PartSize == 0 {
fs.config.PartSize = s3manager.DefaultUploadPartSize
} else {
fs.config.PartSize *= 1024 * 1024
}

sessOpts := session.Options{
Config: *awsConfig,
SharedConfigState: session.SharedConfigEnable,
Expand Down Expand Up @@ -201,6 +208,7 @@ func (fs S3Fs) Create(name string, flag int) (*os.File, *pipeat.PipeWriterAt, fu
StorageClass: utils.NilIfEmpty(fs.config.StorageClass),
}, func(u *s3manager.Uploader) {
u.Concurrency = 2
u.PartSize = fs.config.PartSize
})
r.CloseWithError(err)
fsLog(fs, logger.LevelDebug, "upload completed, path: %#v, response: %v, readed bytes: %v, err: %v",
Expand Down
3 changes: 3 additions & 0 deletions vfs/vfs.go
Original file line number Diff line number Diff line change
Expand Up @@ -103,6 +103,9 @@ func ValidateS3FsConfig(config *S3FsConfig) error {
config.KeyPrefix += "/"
}
}
if config.PartSize != 0 && config.PartSize < 5 {
return errors.New("part_size ret cannot be lower than 5MB")
}
return nil
}

Expand Down

0 comments on commit cdf1233

Please sign in to comment.