Support streaming downloads from Google Cloud Storage

This commit is contained in:
George Claghorn 2018-05-01 23:20:56 -04:00 committed by GitHub
parent db7416cda0
commit bf5f41d948
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
5 changed files with 50 additions and 31 deletions

@ -85,7 +85,7 @@ end
# Active Storage
group :storage do
gem "aws-sdk-s3", require: false
gem "google-cloud-storage", "~> 1.8", require: false
gem "google-cloud-storage", "~> 1.11", require: false
gem "azure-storage", require: false
gem "image_processing", "~> 1.2"

@ -240,21 +240,21 @@ GEM
ffi (1.9.21-x86-mingw32)
globalid (0.4.1)
activesupport (>= 4.2.0)
google-api-client (0.17.3)
google-api-client (0.19.8)
addressable (~> 2.5, >= 2.5.1)
googleauth (>= 0.5, < 0.7.0)
httpclient (>= 2.8.1, < 3.0)
mime-types (~> 3.0)
representable (~> 3.0)
retriable (>= 2.0, < 4.0)
google-cloud-core (1.1.0)
google-cloud-core (1.2.0)
google-cloud-env (~> 1.0)
google-cloud-env (1.0.1)
faraday (~> 0.11)
google-cloud-storage (1.9.0)
google-cloud-storage (1.11.0)
digest-crc (~> 0.4)
google-api-client (~> 0.17.0)
google-cloud-core (~> 1.1)
google-api-client (~> 0.19.0)
google-cloud-core (~> 1.2)
googleauth (~> 0.6.2)
googleauth (0.6.2)
faraday (~> 0.12)
@ -523,7 +523,7 @@ DEPENDENCIES
delayed_job
delayed_job_active_record
ffi (<= 1.9.21)
google-cloud-storage (~> 1.8)
google-cloud-storage (~> 1.11)
hiredis
image_processing (~> 1.2)
json (>= 2.0.0)

@ -1,3 +1,8 @@
* The Google Cloud Storage service properly supports streaming downloads.
It now requires version 1.11 or newer of the google-cloud-storage gem.
*George Claghorn*
* Use the [ImageProcessing](https://github.com/janko-m/image_processing) gem
for Active Storage variants, and deprecate the MiniMagick backend.

@ -1,6 +1,6 @@
# frozen_string_literal: true
gem "google-cloud-storage", "~> 1.8"
gem "google-cloud-storage", "~> 1.11"
require "google/cloud/storage"
require "net/http"
@ -32,28 +32,21 @@ def upload(key, io, checksum: nil)
end
end
# FIXME: Download in chunks when given a block.
def download(key)
instrument :download, key: key do
io = file_for(key).download
io.rewind
if block_given?
yield io.string
else
io.string
def download(key, &block)
if block_given?
instrument :streaming_download, key: key do
stream(key, &block)
end
else
instrument :download, key: key do
file_for(key).download.string
end
end
end
def download_chunk(key, range)
instrument :download_chunk, key: key, range: range do
file = file_for(key)
uri = URI(file.signed_url(expires: 30.seconds))
Net::HTTP.start(uri.host, uri.port, use_ssl: uri.scheme == "https") do |client|
client.get(uri, "Range" => "bytes=#{range.begin}-#{range.exclude_end? ? range.end - 1 : range.end}").body
end
file_for(key).download(range: range).string
end
end
@ -111,8 +104,21 @@ def headers_for_direct_upload(key, checksum:, **)
private
attr_reader :config
def file_for(key)
bucket.file(key, skip_lookup: true)
def file_for(key, skip_lookup: true)
bucket.file(key, skip_lookup: skip_lookup)
end
# Reads the file for the given key in chunks, yielding each to the block.
def stream(key)
file = file_for(key, skip_lookup: false)
chunk_size = 5.megabytes
offset = 0
while offset < file.size
yield file.download(range: offset..(offset + chunk_size - 1)).string
offset += chunk_size
end
end
def bucket

@ -51,13 +51,21 @@ module ActiveStorage::Service::SharedServiceTests
end
test "downloading in chunks" do
chunks = []
key = SecureRandom.base58(24)
expected_chunks = [ "a" * 5.megabytes, "b" ]
actual_chunks = []
@service.download(FIXTURE_KEY) do |chunk|
chunks << chunk
begin
@service.upload key, StringIO.new(expected_chunks.join)
@service.download key do |chunk|
actual_chunks << chunk
end
assert_equal expected_chunks, actual_chunks, "Downloaded chunks did not match uploaded data"
ensure
@service.delete key
end
assert_equal [ FIXTURE_DATA ], chunks
end
test "downloading partially" do