2017-08-12 08:32:15 -04:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
2017-07-04 12:11:06 -04:00
|
|
|
require "test_helper"
|
|
|
|
require "database/setup"
|
|
|
|
|
2017-07-27 16:15:38 -04:00
|
|
|
class ActiveStorage::DiskControllerTest < ActionDispatch::IntegrationTest
|
2017-07-04 12:11:06 -04:00
|
|
|
test "showing blob inline" do
|
Prevent content type and disposition bypass in storage service URLs
* Force content-type to binary on service urls for relevant content types
We have a list of content types that must be forcibly served as binary,
but in practice this only means to serve them as attachment always. We
should also set the Content-Type to the configured binary type.
As a bonus: add text/cache-manifest to the list of content types to be
served as binary by default.
* Store content-disposition and content-type in GCS
Forcing these in the service_url when serving the file works fine for S3
and Azure, since these services include params in the signature.
However, GCS specifically excludes response-content-disposition and
response-content-type from the signature, which means an attacker can
modify these and have files that should be served as text/plain attachments
served as inline HTML for example. This makes our attempt to force
specific files to be served as binary and as attachment can be easily
bypassed.
The only way this can be forced in GCS is by storing
content-disposition and content-type in the object metadata.
* Update GCS object metadata after identifying blob
In some cases we create the blob and upload the data before identifying
the content-type, which means we can't store that in GCS right when
uploading. In these, after creating the attachment, we enqueue a job to
identify the blob, and set the content-type.
In other cases, files are uploaded to the storage service via direct
upload link. We create the blob before the direct upload, which happens
independently from the blob creation itself. We then mark the blob as
identified, but we have already the content-type we need without having
put it in the service.
In these two cases, then, we need to update the metadata in the GCS
service.
* Include content-type and disposition in the verified key for disk service
This prevents an attacker from modifying these params in the service
signed URL, which is particularly important when we want to force them
to have specific values for security reasons.
* Allow only a list of specific content types to be served inline
This is different from the content types that must be served as binary
in the sense that any content type not in this list will be always
served as attachment but with its original content type. Only types in
this list are allowed to be served either inline or as attachment.
Apart from forcing this in the service URL, for GCS we need to store the
disposition in the metadata.
Fix CVE-2018-16477.
2018-09-06 10:52:52 -04:00
|
|
|
blob = create_blob(filename: "hello.jpg", content_type: "image/jpg")
|
|
|
|
|
2019-07-22 11:46:02 -04:00
|
|
|
get blob.url
|
2018-07-15 19:58:14 -04:00
|
|
|
assert_response :ok
|
Prevent content type and disposition bypass in storage service URLs
* Force content-type to binary on service urls for relevant content types
We have a list of content types that must be forcibly served as binary,
but in practice this only means to serve them as attachment always. We
should also set the Content-Type to the configured binary type.
As a bonus: add text/cache-manifest to the list of content types to be
served as binary by default.
* Store content-disposition and content-type in GCS
Forcing these in the service_url when serving the file works fine for S3
and Azure, since these services include params in the signature.
However, GCS specifically excludes response-content-disposition and
response-content-type from the signature, which means an attacker can
modify these and have files that should be served as text/plain attachments
served as inline HTML for example. This makes our attempt to force
specific files to be served as binary and as attachment can be easily
bypassed.
The only way this can be forced in GCS is by storing
content-disposition and content-type in the object metadata.
* Update GCS object metadata after identifying blob
In some cases we create the blob and upload the data before identifying
the content-type, which means we can't store that in GCS right when
uploading. In these, after creating the attachment, we enqueue a job to
identify the blob, and set the content-type.
In other cases, files are uploaded to the storage service via direct
upload link. We create the blob before the direct upload, which happens
independently from the blob creation itself. We then mark the blob as
identified, but we have already the content-type we need without having
put it in the service.
In these two cases, then, we need to update the metadata in the GCS
service.
* Include content-type and disposition in the verified key for disk service
This prevents an attacker from modifying these params in the service
signed URL, which is particularly important when we want to force them
to have specific values for security reasons.
* Allow only a list of specific content types to be served inline
This is different from the content types that must be served as binary
in the sense that any content type not in this list will be always
served as attachment but with its original content type. Only types in
this list are allowed to be served either inline or as attachment.
Apart from forcing this in the service URL, for GCS we need to store the
disposition in the metadata.
Fix CVE-2018-16477.
2018-09-06 10:52:52 -04:00
|
|
|
assert_equal "inline; filename=\"hello.jpg\"; filename*=UTF-8''hello.jpg", response.headers["Content-Disposition"]
|
|
|
|
assert_equal "image/jpg", response.headers["Content-Type"]
|
2018-05-03 09:03:48 -04:00
|
|
|
assert_equal "Hello world!", response.body
|
2017-07-04 12:11:06 -04:00
|
|
|
end
|
|
|
|
|
2017-07-27 16:52:57 -04:00
|
|
|
test "showing blob as attachment" do
|
2017-07-25 21:03:48 -04:00
|
|
|
blob = create_blob
|
2019-07-22 11:46:02 -04:00
|
|
|
get blob.url(disposition: :attachment)
|
2018-07-15 19:58:14 -04:00
|
|
|
assert_response :ok
|
2018-05-03 09:03:48 -04:00
|
|
|
assert_equal "attachment; filename=\"hello.txt\"; filename*=UTF-8''hello.txt", response.headers["Content-Disposition"]
|
|
|
|
assert_equal "text/plain", response.headers["Content-Type"]
|
|
|
|
assert_equal "Hello world!", response.body
|
2017-07-04 12:11:06 -04:00
|
|
|
end
|
2017-07-25 21:03:48 -04:00
|
|
|
|
2018-11-27 20:35:57 -05:00
|
|
|
test "showing blob range" do
|
2018-07-15 19:58:14 -04:00
|
|
|
blob = create_blob
|
2019-07-22 11:46:02 -04:00
|
|
|
get blob.url, headers: { "Range" => "bytes=5-9" }
|
2018-07-15 19:58:14 -04:00
|
|
|
assert_response :partial_content
|
2018-11-27 20:35:57 -05:00
|
|
|
assert_equal "attachment; filename=\"hello.txt\"; filename*=UTF-8''hello.txt", response.headers["Content-Disposition"]
|
2018-07-15 19:58:14 -04:00
|
|
|
assert_equal "text/plain", response.headers["Content-Type"]
|
|
|
|
assert_equal " worl", response.body
|
|
|
|
end
|
|
|
|
|
2018-08-18 14:03:52 -04:00
|
|
|
test "showing blob that does not exist" do
|
|
|
|
blob = create_blob
|
|
|
|
blob.delete
|
|
|
|
|
2019-07-22 11:46:02 -04:00
|
|
|
get blob.url
|
Prevent content type and disposition bypass in storage service URLs
* Force content-type to binary on service urls for relevant content types
We have a list of content types that must be forcibly served as binary,
but in practice this only means to serve them as attachment always. We
should also set the Content-Type to the configured binary type.
As a bonus: add text/cache-manifest to the list of content types to be
served as binary by default.
* Store content-disposition and content-type in GCS
Forcing these in the service_url when serving the file works fine for S3
and Azure, since these services include params in the signature.
However, GCS specifically excludes response-content-disposition and
response-content-type from the signature, which means an attacker can
modify these and have files that should be served as text/plain attachments
served as inline HTML for example. This makes our attempt to force
specific files to be served as binary and as attachment can be easily
bypassed.
The only way this can be forced in GCS is by storing
content-disposition and content-type in the object metadata.
* Update GCS object metadata after identifying blob
In some cases we create the blob and upload the data before identifying
the content-type, which means we can't store that in GCS right when
uploading. In these, after creating the attachment, we enqueue a job to
identify the blob, and set the content-type.
In other cases, files are uploaded to the storage service via direct
upload link. We create the blob before the direct upload, which happens
independently from the blob creation itself. We then mark the blob as
identified, but we have already the content-type we need without having
put it in the service.
In these two cases, then, we need to update the metadata in the GCS
service.
* Include content-type and disposition in the verified key for disk service
This prevents an attacker from modifying these params in the service
signed URL, which is particularly important when we want to force them
to have specific values for security reasons.
* Allow only a list of specific content types to be served inline
This is different from the content types that must be served as binary
in the sense that any content type not in this list will be always
served as attachment but with its original content type. Only types in
this list are allowed to be served either inline or as attachment.
Apart from forcing this in the service URL, for GCS we need to store the
disposition in the metadata.
Fix CVE-2018-16477.
2018-09-06 10:52:52 -04:00
|
|
|
end
|
|
|
|
|
|
|
|
test "showing blob with invalid key" do
|
|
|
|
get rails_disk_service_url(encoded_key: "Invalid key", filename: "hello.txt")
|
2018-08-18 14:03:52 -04:00
|
|
|
assert_response :not_found
|
|
|
|
end
|
|
|
|
|
2019-12-05 22:31:23 -05:00
|
|
|
test "showing public blob" do
|
|
|
|
with_service("local_public") do
|
|
|
|
blob = create_blob(content_type: "image/jpg")
|
|
|
|
|
|
|
|
get blob.url
|
|
|
|
assert_response :ok
|
|
|
|
assert_equal "image/jpg", response.headers["Content-Type"]
|
|
|
|
assert_equal "Hello world!", response.body
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
test "showing public blob variant" do
|
|
|
|
with_service("local_public") do
|
|
|
|
blob = create_file_blob.variant(resize_to_limit: [100, 100]).processed
|
|
|
|
|
|
|
|
get blob.url
|
|
|
|
assert_response :ok
|
|
|
|
assert_equal "image/jpeg", response.headers["Content-Type"]
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2017-07-25 21:03:48 -04:00
|
|
|
test "directly uploading blob with integrity" do
|
2017-07-27 17:05:38 -04:00
|
|
|
data = "Something else entirely!"
|
|
|
|
blob = create_blob_before_direct_upload byte_size: data.size, checksum: Digest::MD5.base64digest(data)
|
2017-07-25 21:03:48 -04:00
|
|
|
|
2017-07-27 17:05:38 -04:00
|
|
|
put blob.service_url_for_direct_upload, params: data, headers: { "Content-Type" => "text/plain" }
|
2017-07-25 21:03:48 -04:00
|
|
|
assert_response :no_content
|
|
|
|
assert_equal data, blob.download
|
|
|
|
end
|
|
|
|
|
|
|
|
test "directly uploading blob without integrity" do
|
2017-07-27 17:05:38 -04:00
|
|
|
data = "Something else entirely!"
|
|
|
|
blob = create_blob_before_direct_upload byte_size: data.size, checksum: Digest::MD5.base64digest("bad data")
|
2017-07-27 16:52:57 -04:00
|
|
|
|
2017-07-27 17:05:38 -04:00
|
|
|
put blob.service_url_for_direct_upload, params: data
|
2017-07-27 16:52:57 -04:00
|
|
|
assert_response :unprocessable_entity
|
|
|
|
assert_not blob.service.exist?(blob.key)
|
|
|
|
end
|
|
|
|
|
|
|
|
test "directly uploading blob with mismatched content type" do
|
2017-07-27 17:05:38 -04:00
|
|
|
data = "Something else entirely!"
|
|
|
|
blob = create_blob_before_direct_upload byte_size: data.size, checksum: Digest::MD5.base64digest(data)
|
2017-07-25 21:03:48 -04:00
|
|
|
|
2017-07-27 17:05:38 -04:00
|
|
|
put blob.service_url_for_direct_upload, params: data, headers: { "Content-Type" => "application/octet-stream" }
|
2017-07-27 16:52:57 -04:00
|
|
|
assert_response :unprocessable_entity
|
|
|
|
assert_not blob.service.exist?(blob.key)
|
|
|
|
end
|
2017-07-25 21:03:48 -04:00
|
|
|
|
2018-10-07 15:22:58 -04:00
|
|
|
test "directly uploading blob with different but equivalent content type" do
|
|
|
|
data = "Something else entirely!"
|
|
|
|
blob = create_blob_before_direct_upload(
|
|
|
|
byte_size: data.size, checksum: Digest::MD5.base64digest(data), content_type: "application/x-gzip")
|
|
|
|
|
|
|
|
put blob.service_url_for_direct_upload, params: data, headers: { "Content-Type" => "application/x-gzip" }
|
|
|
|
assert_response :no_content
|
|
|
|
assert_equal data, blob.download
|
|
|
|
end
|
|
|
|
|
2017-07-27 16:52:57 -04:00
|
|
|
test "directly uploading blob with mismatched content length" do
|
2017-07-27 17:05:38 -04:00
|
|
|
data = "Something else entirely!"
|
|
|
|
blob = create_blob_before_direct_upload byte_size: data.size - 1, checksum: Digest::MD5.base64digest(data)
|
2017-07-25 21:03:48 -04:00
|
|
|
|
2017-07-27 17:05:38 -04:00
|
|
|
put blob.service_url_for_direct_upload, params: data, headers: { "Content-Type" => "text/plain" }
|
2017-07-25 21:03:48 -04:00
|
|
|
assert_response :unprocessable_entity
|
|
|
|
assert_not blob.service.exist?(blob.key)
|
|
|
|
end
|
2018-07-15 20:12:53 -04:00
|
|
|
|
|
|
|
test "directly uploading blob with invalid token" do
|
|
|
|
put update_rails_disk_service_url(encoded_token: "invalid"),
|
|
|
|
params: "Something else entirely!", headers: { "Content-Type" => "text/plain" }
|
|
|
|
assert_response :not_found
|
|
|
|
end
|
2017-07-04 12:11:06 -04:00
|
|
|
end
|