Commit 6e8825f9 authored by Jacob Vosmaer's avatar Jacob Vosmaer

Merge branch 'eb-new-upload-metadata' into 'master'

Include upload_duration in finalized fields

See merge request gitlab-org/gitlab!71501
parents 45bfa8c6 59cc9289
# frozen_string_literal: true
module Gitlab
module Instrumentation
class Uploads
UPLOAD_DURATION = :uploaded_file_upload_duration_s
UPLOADED_FILE_SIZE = :uploaded_file_size_bytes
def self.track(uploaded_file)
if ::Gitlab::SafeRequestStore.active?
::Gitlab::SafeRequestStore[UPLOAD_DURATION] = uploaded_file.upload_duration
::Gitlab::SafeRequestStore[UPLOADED_FILE_SIZE] = uploaded_file.size
end
end
def self.get_upload_duration
::Gitlab::SafeRequestStore[UPLOAD_DURATION]
end
def self.get_uploaded_file_size
::Gitlab::SafeRequestStore[UPLOADED_FILE_SIZE]
end
def self.payload
{
UPLOAD_DURATION => get_upload_duration,
UPLOADED_FILE_SIZE => get_uploaded_file_size
}.compact
end
end
end
end
...@@ -31,6 +31,7 @@ module Gitlab ...@@ -31,6 +31,7 @@ module Gitlab
instrument_thread_memory_allocations(payload) instrument_thread_memory_allocations(payload)
instrument_load_balancing(payload) instrument_load_balancing(payload)
instrument_pid(payload) instrument_pid(payload)
instrument_uploads(payload)
end end
def instrument_gitaly(payload) def instrument_gitaly(payload)
...@@ -116,6 +117,10 @@ module Gitlab ...@@ -116,6 +117,10 @@ module Gitlab
payload.merge!(load_balancing_payload) payload.merge!(load_balancing_payload)
end end
def instrument_uploads(payload)
payload.merge! ::Gitlab::Instrumentation::Uploads.payload
end
# Returns the queuing duration for a Sidekiq job in seconds, as a float, if the # Returns the queuing duration for a Sidekiq job in seconds, as a float, if the
# `enqueued_at` field or `created_at` field is available. # `enqueued_at` field or `created_at` field is available.
# #
......
...@@ -20,8 +20,9 @@ class UploadedFile ...@@ -20,8 +20,9 @@ class UploadedFile
attr_reader :remote_id attr_reader :remote_id
attr_reader :sha256 attr_reader :sha256
attr_reader :size attr_reader :size
attr_reader :upload_duration
def initialize(path, filename: nil, content_type: "application/octet-stream", sha256: nil, remote_id: nil, size: nil) def initialize(path, filename: nil, content_type: "application/octet-stream", sha256: nil, remote_id: nil, size: nil, upload_duration: nil)
if path.present? if path.present?
raise InvalidPathError, "#{path} file does not exist" unless ::File.exist?(path) raise InvalidPathError, "#{path} file does not exist" unless ::File.exist?(path)
...@@ -35,6 +36,12 @@ class UploadedFile ...@@ -35,6 +36,12 @@ class UploadedFile
end end
end end
begin
@upload_duration = Float(upload_duration)
rescue ArgumentError, TypeError
@upload_duration = 0
end
@content_type = content_type @content_type = content_type
@original_filename = sanitize_filename(filename || path || '') @original_filename = sanitize_filename(filename || path || '')
@content_type = content_type @content_type = content_type
...@@ -64,8 +71,11 @@ class UploadedFile ...@@ -64,8 +71,11 @@ class UploadedFile
content_type: params['type'] || 'application/octet-stream', content_type: params['type'] || 'application/octet-stream',
sha256: params['sha256'], sha256: params['sha256'],
remote_id: remote_id, remote_id: remote_id,
size: params['size'] size: params['size'],
) upload_duration: params['upload_duration']
).tap do |uploaded_file|
::Gitlab::Instrumentation::Uploads.track(uploaded_file)
end
end end
def self.allowed_path?(file_path, paths) def self.allowed_path?(file_path, paths)
......
...@@ -147,6 +147,25 @@ RSpec.describe Gitlab::InstrumentationHelper do ...@@ -147,6 +147,25 @@ RSpec.describe Gitlab::InstrumentationHelper do
expect(payload).not_to include(:caught_up_replica_pick_fail) expect(payload).not_to include(:caught_up_replica_pick_fail)
end end
end end
context 'when there is an uploaded file' do
it 'adds upload data' do
uploaded_file = UploadedFile.from_params({
'name' => 'dir/foo.txt',
'sha256' => 'sha256',
'remote_url' => 'http://localhost/file',
'remote_id' => '1234567890',
'etag' => 'etag1234567890',
'upload_duration' => '5.05',
'size' => '123456'
}, nil)
subject
expect(payload[:uploaded_file_upload_duration_s]).to eq(uploaded_file.upload_duration)
expect(payload[:uploaded_file_size_bytes]).to eq(uploaded_file.size)
end
end
end end
describe 'duration calculations' do describe 'duration calculations' do
......
...@@ -15,7 +15,7 @@ RSpec.describe UploadedFile do ...@@ -15,7 +15,7 @@ RSpec.describe UploadedFile do
end end
context 'from_params functions' do context 'from_params functions' do
RSpec.shared_examples 'using the file path' do |filename:, content_type:, sha256:, path_suffix:| RSpec.shared_examples 'using the file path' do |filename:, content_type:, sha256:, path_suffix:, upload_duration:|
it { is_expected.not_to be_nil } it { is_expected.not_to be_nil }
it 'sets properly the attributes' do it 'sets properly the attributes' do
...@@ -24,6 +24,7 @@ RSpec.describe UploadedFile do ...@@ -24,6 +24,7 @@ RSpec.describe UploadedFile do
expect(subject.sha256).to eq(sha256) expect(subject.sha256).to eq(sha256)
expect(subject.remote_id).to be_nil expect(subject.remote_id).to be_nil
expect(subject.path).to end_with(path_suffix) expect(subject.path).to end_with(path_suffix)
expect(subject.upload_duration).to eq(upload_duration)
end end
it 'handles a blank path' do it 'handles a blank path' do
...@@ -37,16 +38,17 @@ RSpec.describe UploadedFile do ...@@ -37,16 +38,17 @@ RSpec.describe UploadedFile do
end end
end end
RSpec.shared_examples 'using the remote id' do |filename:, content_type:, sha256:, size:, remote_id:| RSpec.shared_examples 'using the remote id' do |filename:, content_type:, sha256:, size:, remote_id:, upload_duration:|
it { is_expected.not_to be_nil } it { is_expected.not_to be_nil }
it 'sets properly the attributes' do it 'sets properly the attributes' do
expect(subject.original_filename).to eq(filename) expect(subject.original_filename).to eq(filename)
expect(subject.content_type).to eq('application/octet-stream') expect(subject.content_type).to eq(content_type)
expect(subject.sha256).to eq('sha256') expect(subject.sha256).to eq(sha256)
expect(subject.path).to be_nil expect(subject.path).to be_nil
expect(subject.size).to eq(123456) expect(subject.size).to eq(size)
expect(subject.remote_id).to eq('1234567890') expect(subject.remote_id).to eq(remote_id)
expect(subject.upload_duration).to eq(upload_duration)
end end
end end
...@@ -78,6 +80,7 @@ RSpec.describe UploadedFile do ...@@ -78,6 +80,7 @@ RSpec.describe UploadedFile do
{ 'path' => temp_file.path, { 'path' => temp_file.path,
'name' => 'dir/my file&.txt', 'name' => 'dir/my file&.txt',
'type' => 'my/type', 'type' => 'my/type',
'upload_duration' => '5.05',
'sha256' => 'sha256' } 'sha256' => 'sha256' }
end end
...@@ -85,7 +88,8 @@ RSpec.describe UploadedFile do ...@@ -85,7 +88,8 @@ RSpec.describe UploadedFile do
filename: 'my_file_.txt', filename: 'my_file_.txt',
content_type: 'my/type', content_type: 'my/type',
sha256: 'sha256', sha256: 'sha256',
path_suffix: 'test' path_suffix: 'test',
upload_duration: 5.05
end end
context 'with a remote id' do context 'with a remote id' do
...@@ -96,6 +100,7 @@ RSpec.describe UploadedFile do ...@@ -96,6 +100,7 @@ RSpec.describe UploadedFile do
'remote_url' => 'http://localhost/file', 'remote_url' => 'http://localhost/file',
'remote_id' => '1234567890', 'remote_id' => '1234567890',
'etag' => 'etag1234567890', 'etag' => 'etag1234567890',
'upload_duration' => '5.05',
'size' => '123456' 'size' => '123456'
} }
end end
...@@ -105,7 +110,8 @@ RSpec.describe UploadedFile do ...@@ -105,7 +110,8 @@ RSpec.describe UploadedFile do
content_type: 'application/octet-stream', content_type: 'application/octet-stream',
sha256: 'sha256', sha256: 'sha256',
size: 123456, size: 123456,
remote_id: '1234567890' remote_id: '1234567890',
upload_duration: 5.05
end end
context 'with a path and a remote id' do context 'with a path and a remote id' do
...@@ -117,6 +123,7 @@ RSpec.describe UploadedFile do ...@@ -117,6 +123,7 @@ RSpec.describe UploadedFile do
'remote_url' => 'http://localhost/file', 'remote_url' => 'http://localhost/file',
'remote_id' => '1234567890', 'remote_id' => '1234567890',
'etag' => 'etag1234567890', 'etag' => 'etag1234567890',
'upload_duration' => '5.05',
'size' => '123456' 'size' => '123456'
} }
end end
...@@ -126,7 +133,8 @@ RSpec.describe UploadedFile do ...@@ -126,7 +133,8 @@ RSpec.describe UploadedFile do
content_type: 'application/octet-stream', content_type: 'application/octet-stream',
sha256: 'sha256', sha256: 'sha256',
size: 123456, size: 123456,
remote_id: '1234567890' remote_id: '1234567890',
upload_duration: 5.05
end end
end end
end end
...@@ -216,6 +224,44 @@ RSpec.describe UploadedFile do ...@@ -216,6 +224,44 @@ RSpec.describe UploadedFile do
end.to raise_error(UploadedFile::UnknownSizeError, 'Unable to determine file size') end.to raise_error(UploadedFile::UnknownSizeError, 'Unable to determine file size')
end end
end end
context 'when upload_duration is not provided' do
it 'sets upload_duration to zero' do
file = described_class.new(temp_file.path)
expect(file.upload_duration).to be_zero
end
end
context 'when upload_duration is provided' do
let(:file) { described_class.new(temp_file.path, upload_duration: duration) }
context 'and upload_duration is a number' do
let(:duration) { 5.505 }
it 'sets the upload_duration' do
expect(file.upload_duration).to eq(duration)
end
end
context 'and upload_duration is a string' do
context 'and represents a number' do
let(:duration) { '5.505' }
it 'converts upload_duration to a number' do
expect(file.upload_duration).to eq(duration.to_f)
end
end
context 'and does not represent a number' do
let(:duration) { 'not a number' }
it 'sets upload_duration to zero' do
expect(file.upload_duration).to be_zero
end
end
end
end
end end
describe '#sanitize_filename' do describe '#sanitize_filename' do
......
...@@ -43,6 +43,9 @@ type FileHandler struct { ...@@ -43,6 +43,9 @@ type FileHandler struct {
// a map containing different hashes // a map containing different hashes
hashes map[string]string hashes map[string]string
// Duration of upload in seconds
uploadDuration float64
} }
type uploadClaims struct { type uploadClaims struct {
...@@ -74,11 +77,12 @@ func (fh *FileHandler) GitLabFinalizeFields(prefix string) (map[string]string, e ...@@ -74,11 +77,12 @@ func (fh *FileHandler) GitLabFinalizeFields(prefix string) (map[string]string, e
} }
for k, v := range map[string]string{ for k, v := range map[string]string{
"name": fh.Name, "name": fh.Name,
"path": fh.LocalPath, "path": fh.LocalPath,
"remote_url": fh.RemoteURL, "remote_url": fh.RemoteURL,
"remote_id": fh.RemoteID, "remote_id": fh.RemoteID,
"size": strconv.FormatInt(fh.Size, 10), "size": strconv.FormatInt(fh.Size, 10),
"upload_duration": strconv.FormatFloat(fh.uploadDuration, 'f', -1, 64),
} { } {
data[key(k)] = v data[key(k)] = v
signedData[k] = v signedData[k] = v
...@@ -105,18 +109,20 @@ type consumer interface { ...@@ -105,18 +109,20 @@ type consumer interface {
// SaveFileFromReader persists the provided reader content to all the location specified in opts. A cleanup will be performed once ctx is Done // SaveFileFromReader persists the provided reader content to all the location specified in opts. A cleanup will be performed once ctx is Done
// Make sure the provided context will not expire before finalizing upload with GitLab Rails. // Make sure the provided context will not expire before finalizing upload with GitLab Rails.
func SaveFileFromReader(ctx context.Context, reader io.Reader, size int64, opts *SaveFileOpts) (fh *FileHandler, err error) { func SaveFileFromReader(ctx context.Context, reader io.Reader, size int64, opts *SaveFileOpts) (*FileHandler, error) {
var uploadDestination consumer fh := &FileHandler{
fh = &FileHandler{
Name: opts.TempFilePrefix, Name: opts.TempFilePrefix,
RemoteID: opts.RemoteID, RemoteID: opts.RemoteID,
RemoteURL: opts.RemoteURL, RemoteURL: opts.RemoteURL,
} }
uploadStartTime := time.Now()
defer func() { fh.uploadDuration = time.Since(uploadStartTime).Seconds() }()
hashes := newMultiHash() hashes := newMultiHash()
reader = io.TeeReader(reader, hashes.Writer) reader = io.TeeReader(reader, hashes.Writer)
var clientMode string var clientMode string
var uploadDestination consumer
var err error
switch { switch {
case opts.IsLocal(): case opts.IsLocal():
clientMode = "local" clientMode = "local"
...@@ -161,23 +167,19 @@ func SaveFileFromReader(ctx context.Context, reader io.Reader, size int64, opts ...@@ -161,23 +167,19 @@ func SaveFileFromReader(ctx context.Context, reader io.Reader, size int64, opts
return nil, err return nil, err
} }
var hlr *hardLimitReader
if opts.MaximumSize > 0 { if opts.MaximumSize > 0 {
if size > opts.MaximumSize { if size > opts.MaximumSize {
return nil, SizeError(fmt.Errorf("the upload size %d is over maximum of %d bytes", size, opts.MaximumSize)) return nil, SizeError(fmt.Errorf("the upload size %d is over maximum of %d bytes", size, opts.MaximumSize))
} }
hlr := &hardLimitReader{r: reader, n: opts.MaximumSize} hlr = &hardLimitReader{r: reader, n: opts.MaximumSize}
reader = hlr reader = hlr
defer func() {
if hlr.n < 0 {
err = ErrEntityTooLarge
}
}()
} }
fh.Size, err = uploadDestination.Consume(ctx, reader, opts.Deadline) fh.Size, err = uploadDestination.Consume(ctx, reader, opts.Deadline)
if err != nil { if err != nil {
if err == objectstore.ErrNotEnoughParts { if (err == objectstore.ErrNotEnoughParts) || (hlr != nil && hlr.n < 0) {
err = ErrEntityTooLarge err = ErrEntityTooLarge
} }
return nil, err return nil, err
......
...@@ -548,4 +548,5 @@ func checkFileHandlerWithFields(t *testing.T, fh *filestore.FileHandler, fields ...@@ -548,4 +548,5 @@ func checkFileHandlerWithFields(t *testing.T, fh *filestore.FileHandler, fields
require.Equal(t, test.ObjectSHA1, fields[key("sha1")]) require.Equal(t, test.ObjectSHA1, fields[key("sha1")])
require.Equal(t, test.ObjectSHA256, fields[key("sha256")]) require.Equal(t, test.ObjectSHA256, fields[key("sha256")])
require.Equal(t, test.ObjectSHA512, fields[key("sha512")]) require.Equal(t, test.ObjectSHA512, fields[key("sha512")])
require.NotEmpty(t, fields[key("upload_duration")])
} }
...@@ -114,7 +114,7 @@ func TestUploadHandlerRewritingMultiPartData(t *testing.T) { ...@@ -114,7 +114,7 @@ func TestUploadHandlerRewritingMultiPartData(t *testing.T) {
require.Equal(t, hash, r.FormValue("file."+algo), "file hash %s", algo) require.Equal(t, hash, r.FormValue("file."+algo), "file hash %s", algo)
} }
require.Len(t, r.MultipartForm.Value, 11, "multipart form values") require.Len(t, r.MultipartForm.Value, 12, "multipart form values")
w.WriteHeader(202) w.WriteHeader(202)
fmt.Fprint(w, "RESPONSE") fmt.Fprint(w, "RESPONSE")
......
...@@ -83,7 +83,7 @@ func uploadTestServer(t *testing.T, authorizeTests func(r *http.Request), extraT ...@@ -83,7 +83,7 @@ func uploadTestServer(t *testing.T, authorizeTests func(r *http.Request), extraT
require.NoError(t, r.ParseMultipartForm(100000)) require.NoError(t, r.ParseMultipartForm(100000))
const nValues = 10 // file name, path, remote_url, remote_id, size, md5, sha1, sha256, sha512, gitlab-workhorse-upload for just the upload (no metadata because we are not POSTing a valid zip file) const nValues = 11 // file name, path, remote_url, remote_id, size, md5, sha1, sha256, sha512, upload_duration, gitlab-workhorse-upload for just the upload (no metadata because we are not POSTing a valid zip file)
require.Len(t, r.MultipartForm.Value, nValues) require.Len(t, r.MultipartForm.Value, nValues)
require.Empty(t, r.MultipartForm.File, "multipart form files") require.Empty(t, r.MultipartForm.File, "multipart form files")
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment