# frozen_string_literal: true module BulkImports class FileDownloadService FILE_SIZE_LIMIT = 5.gigabytes ALLOWED_CONTENT_TYPES = %w(application/gzip application/octet-stream).freeze ServiceError = Class.new(StandardError) def initialize(configuration:, relative_url:, dir:, filename:) @configuration = configuration @relative_url = relative_url @filename = filename @dir = dir @filepath = File.join(@dir, @filename) end def execute validate_dir validate_url validate_content_type validate_content_length download_file validate_symlink filepath end private attr_reader :configuration, :relative_url, :dir, :filename, :filepath def download_file File.open(filepath, 'wb') do |file| bytes_downloaded = 0 http_client.stream(relative_url) do |chunk| bytes_downloaded += chunk.size raise(ServiceError, 'Invalid downloaded file') if bytes_downloaded > FILE_SIZE_LIMIT raise(ServiceError, "File download error #{chunk.code}") unless chunk.code == 200 file.write(chunk) end end rescue StandardError => e File.delete(filepath) if File.exist?(filepath) raise e end def http_client @http_client ||= BulkImports::Clients::HTTP.new( uri: configuration.url, token: configuration.access_token ) end def allow_local_requests? ::Gitlab::CurrentSettings.allow_local_requests_from_web_hooks_and_services? end def headers @headers ||= http_client.head(relative_url).headers end def validate_dir raise(ServiceError, 'Invalid target directory') unless dir.start_with?(Dir.tmpdir) end def validate_symlink if File.lstat(filepath).symlink? File.delete(filepath) raise(ServiceError, 'Invalid downloaded file') end end def validate_url ::Gitlab::UrlBlocker.validate!( http_client.resource_url(relative_url), allow_localhost: allow_local_requests?, allow_local_network: allow_local_requests?, schemes: %w(http https) ) end def validate_content_length content_size = headers['content-length'] raise(ServiceError, 'Invalid content length') if content_size.blank? || content_size.to_i > FILE_SIZE_LIMIT end def validate_content_type content_type = headers['content-type'] raise(ServiceError, 'Invalid content type') if content_type.blank? || ALLOWED_CONTENT_TYPES.exclude?(content_type) end end end