| // Copyright 2017 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "content/browser/download/download_utils.h" |
| |
| #include "base/format_macros.h" |
| #include "base/memory/ptr_util.h" |
| #include "base/process/process_handle.h" |
| #include "base/strings/stringprintf.h" |
| #include "components/download/downloader/in_progress/download_entry.h" |
| #include "components/download/downloader/in_progress/in_progress_cache.h" |
| #include "content/browser/download/download_create_info.h" |
| #include "content/browser/download/download_interrupt_reasons_impl.h" |
| #include "content/browser/download/download_stats.h" |
| #include "content/public/browser/browser_context.h" |
| #include "content/public/browser/browser_thread.h" |
| #include "content/public/browser/download_manager_delegate.h" |
| #include "content/public/browser/download_save_info.h" |
| #include "content/public/browser/download_url_parameters.h" |
| #include "content/public/browser/render_frame_host.h" |
| #include "content/public/browser/render_process_host.h" |
| #include "net/base/elements_upload_data_stream.h" |
| #include "net/base/load_flags.h" |
| #include "net/base/upload_bytes_element_reader.h" |
| #include "net/http/http_request_headers.h" |
| #include "net/http/http_status_code.h" |
| #include "net/url_request/url_request_context.h" |
| #include "services/network/public/cpp/resource_request.h" |
| |
| namespace content { |
| |
| namespace { |
| |
| void AppendExtraHeaders(net::HttpRequestHeaders* headers, |
| DownloadUrlParameters* params) { |
| for (const auto& header : params->request_headers()) |
| headers->SetHeaderIfMissing(header.first, header.second); |
| } |
| |
| int GetLoadFlags(DownloadUrlParameters* params, bool has_upload_data) { |
| int load_flags = 0; |
| if (params->prefer_cache()) { |
| // If there is upload data attached, only retrieve from cache because there |
| // is no current mechanism to prompt the user for their consent for a |
| // re-post. For GETs, try to retrieve data from the cache and skip |
| // validating the entry if present. |
| if (has_upload_data) |
| load_flags |= net::LOAD_ONLY_FROM_CACHE | net::LOAD_SKIP_CACHE_VALIDATION; |
| else |
| load_flags |= net::LOAD_SKIP_CACHE_VALIDATION; |
| } else { |
| load_flags |= net::LOAD_DISABLE_CACHE; |
| } |
| return load_flags; |
| } |
| |
| std::unique_ptr<net::HttpRequestHeaders> GetAdditionalRequestHeaders( |
| DownloadUrlParameters* params) { |
| auto headers = std::make_unique<net::HttpRequestHeaders>(); |
| if (params->offset() == 0 && |
| params->length() == DownloadSaveInfo::kLengthFullContent) { |
| AppendExtraHeaders(headers.get(), params); |
| return headers; |
| } |
| |
| bool has_last_modified = !params->last_modified().empty(); |
| bool has_etag = !params->etag().empty(); |
| |
| // Strong validator(i.e. etag or last modified) is required in range requests |
| // for download resumption and parallel download. |
| DCHECK(has_etag || has_last_modified); |
| if (!has_etag && !has_last_modified) { |
| DVLOG(1) << "Creating partial request without strong validators."; |
| AppendExtraHeaders(headers.get(), params); |
| return headers; |
| } |
| |
| // Add "Range" header. |
| std::string range_header = |
| (params->length() == DownloadSaveInfo::kLengthFullContent) |
| ? base::StringPrintf("bytes=%" PRId64 "-", params->offset()) |
| : base::StringPrintf("bytes=%" PRId64 "-%" PRId64, params->offset(), |
| params->offset() + params->length() - 1); |
| headers->SetHeader(net::HttpRequestHeaders::kRange, range_header); |
| |
| // Add "If-Range" headers. |
| if (params->use_if_range()) { |
| // In accordance with RFC 7233 Section 3.2, use If-Range to specify that |
| // the server return the entire entity if the validator doesn't match. |
| // Last-Modified can be used in the absence of ETag as a validator if the |
| // response headers satisfied the HttpUtil::HasStrongValidators() |
| // predicate. |
| // |
| // This function assumes that HasStrongValidators() was true and that the |
| // ETag and Last-Modified header values supplied are valid. |
| headers->SetHeader(net::HttpRequestHeaders::kIfRange, |
| has_etag ? params->etag() : params->last_modified()); |
| AppendExtraHeaders(headers.get(), params); |
| return headers; |
| } |
| |
| // Add "If-Match"/"If-Unmodified-Since" headers. |
| if (has_etag) |
| headers->SetHeader(net::HttpRequestHeaders::kIfMatch, params->etag()); |
| |
| // According to RFC 7232 section 3.4, "If-Unmodified-Since" is mainly for |
| // old servers that didn't implement "If-Match" and must be ignored when |
| // "If-Match" presents. |
| if (has_last_modified) { |
| headers->SetHeader(net::HttpRequestHeaders::kIfUnmodifiedSince, |
| params->last_modified()); |
| } |
| |
| AppendExtraHeaders(headers.get(), params); |
| return headers; |
| } |
| |
| } // namespace |
| |
| DownloadInterruptReason HandleRequestCompletionStatus( |
| net::Error error_code, bool has_strong_validators, |
| net::CertStatus cert_status, DownloadInterruptReason abort_reason) { |
| // ERR_CONTENT_LENGTH_MISMATCH can be caused by 1 of the following reasons: |
| // 1. Server or proxy closes the connection too early. |
| // 2. The content-length header is wrong. |
| // If the download has strong validators, we can interrupt the download |
| // and let it resume automatically. Otherwise, resuming the download will |
| // cause it to restart and the download may never complete if the error was |
| // caused by reason 2. As a result, downloads without strong validators are |
| // treated as completed here. |
| // TODO(qinmin): check the metrics from downloads with strong validators, |
| // and decide whether we should interrupt downloads without strong validators |
| // rather than complete them. |
| if (error_code == net::ERR_CONTENT_LENGTH_MISMATCH && |
| !has_strong_validators) { |
| error_code = net::OK; |
| RecordDownloadCount(COMPLETED_WITH_CONTENT_LENGTH_MISMATCH_COUNT); |
| } |
| |
| if (error_code == net::ERR_ABORTED) { |
| // ERR_ABORTED == something outside of the network |
| // stack cancelled the request. There aren't that many things that |
| // could do this to a download request (whose lifetime is separated from |
| // the tab from which it came). We map this to USER_CANCELLED as the |
| // case we know about (system suspend because of laptop close) corresponds |
| // to a user action. |
| // TODO(asanka): A lid close or other power event should result in an |
| // interruption that doesn't discard the partial state, unlike |
| // USER_CANCELLED. (https://crbug.com/166179) |
| if (net::IsCertStatusError(cert_status)) |
| return DOWNLOAD_INTERRUPT_REASON_SERVER_CERT_PROBLEM; |
| else |
| return DOWNLOAD_INTERRUPT_REASON_USER_CANCELED; |
| } else if (abort_reason != DOWNLOAD_INTERRUPT_REASON_NONE) { |
| // If a more specific interrupt reason was specified before the request |
| // was explicitly cancelled, then use it. |
| return abort_reason; |
| } |
| |
| return ConvertNetErrorToInterruptReason( |
| error_code, DOWNLOAD_INTERRUPT_FROM_NETWORK); |
| } |
| |
| std::unique_ptr<network::ResourceRequest> CreateResourceRequest( |
| DownloadUrlParameters* params) { |
| DCHECK(params->offset() >= 0); |
| |
| std::unique_ptr<network::ResourceRequest> request( |
| new network::ResourceRequest); |
| request->method = params->method(); |
| request->url = params->url(); |
| request->request_initiator = params->initiator(); |
| request->do_not_prompt_for_login = params->do_not_prompt_for_login(); |
| request->site_for_cookies = params->url(); |
| request->referrer = params->referrer().url; |
| request->referrer_policy = |
| Referrer::ReferrerPolicyForUrlRequest(params->referrer().policy); |
| request->download_to_file = true; |
| request->allow_download = true; |
| request->is_main_frame = true; |
| |
| if (params->render_process_host_id() >= 0) |
| request->render_frame_id = params->render_frame_host_routing_id(); |
| |
| bool has_upload_data = false; |
| if (!params->post_body().empty()) { |
| request->request_body = network::ResourceRequestBody::CreateFromBytes( |
| params->post_body().data(), params->post_body().size()); |
| has_upload_data = true; |
| } |
| |
| if (params->post_id() >= 0) { |
| // The POST in this case does not have an actual body, and only works |
| // when retrieving data from cache. This is done because we don't want |
| // to do a re-POST without user consent, and currently don't have a good |
| // plan on how to display the UI for that. |
| DCHECK(params->prefer_cache()); |
| DCHECK_EQ("POST", params->method()); |
| request->request_body = new network::ResourceRequestBody(); |
| request->request_body->set_identifier(params->post_id()); |
| has_upload_data = true; |
| } |
| |
| request->load_flags = GetLoadFlags(params, has_upload_data); |
| |
| // Add additional request headers. |
| std::unique_ptr<net::HttpRequestHeaders> headers = |
| GetAdditionalRequestHeaders(params); |
| request->headers.Swap(headers.get()); |
| |
| return request; |
| } |
| |
| std::unique_ptr<net::URLRequest> |
| CreateURLRequestOnIOThread(DownloadUrlParameters* params) { |
| DCHECK_CURRENTLY_ON(BrowserThread::IO); |
| DCHECK(params->offset() >= 0); |
| |
| // ResourceDispatcherHost{Base} is-not-a URLRequest::Delegate, and |
| // DownloadUrlParameters can-not include resource_dispatcher_host_impl.h, so |
| // we must down cast. RDHI is the only subclass of RDH as of 2012 May 4. |
| std::unique_ptr<net::URLRequest> request( |
| params->url_request_context_getter() |
| ->GetURLRequestContext() |
| ->CreateRequest(params->url(), net::DEFAULT_PRIORITY, nullptr, |
| params->GetNetworkTrafficAnnotation())); |
| request->set_method(params->method()); |
| |
| if (!params->post_body().empty()) { |
| const std::string& body = params->post_body(); |
| std::unique_ptr<net::UploadElementReader> reader( |
| net::UploadOwnedBytesElementReader::CreateWithString(body)); |
| request->set_upload( |
| net::ElementsUploadDataStream::CreateWithReader(std::move(reader), 0)); |
| } |
| |
| if (params->post_id() >= 0) { |
| // The POST in this case does not have an actual body, and only works |
| // when retrieving data from cache. This is done because we don't want |
| // to do a re-POST without user consent, and currently don't have a good |
| // plan on how to display the UI for that. |
| DCHECK(params->prefer_cache()); |
| DCHECK_EQ("POST", params->method()); |
| std::vector<std::unique_ptr<net::UploadElementReader>> element_readers; |
| request->set_upload(std::make_unique<net::ElementsUploadDataStream>( |
| std::move(element_readers), params->post_id())); |
| } |
| |
| request->SetLoadFlags(GetLoadFlags(params, request->get_upload())); |
| |
| // Add additional request headers. |
| std::unique_ptr<net::HttpRequestHeaders> headers = |
| GetAdditionalRequestHeaders(params); |
| if (!headers->IsEmpty()) |
| request->SetExtraRequestHeaders(*headers); |
| |
| // Downloads are treated as top level navigations. Hence the first-party |
| // origin for cookies is always based on the target URL and is updated on |
| // redirects. |
| request->set_site_for_cookies(params->url()); |
| request->set_first_party_url_policy( |
| net::URLRequest::UPDATE_FIRST_PARTY_URL_ON_REDIRECT); |
| request->set_initiator(params->initiator()); |
| |
| return request; |
| } |
| |
| DownloadInterruptReason HandleSuccessfulServerResponse( |
| const net::HttpResponseHeaders& http_headers, |
| DownloadSaveInfo* save_info, |
| bool fetch_error_body) { |
| DownloadInterruptReason result = DOWNLOAD_INTERRUPT_REASON_NONE; |
| switch (http_headers.response_code()) { |
| case -1: // Non-HTTP request. |
| case net::HTTP_OK: |
| case net::HTTP_NON_AUTHORITATIVE_INFORMATION: |
| case net::HTTP_PARTIAL_CONTENT: |
| // Expected successful codes. |
| break; |
| |
| case net::HTTP_CREATED: |
| case net::HTTP_ACCEPTED: |
| // Per RFC 7231 the entity being transferred is metadata about the |
| // resource at the target URL and not the resource at that URL (or the |
| // resource that would be at the URL once processing is completed in the |
| // case of HTTP_ACCEPTED). However, we currently don't have special |
| // handling for these response and they are downloaded the same as a |
| // regular response. |
| break; |
| |
| case net::HTTP_NO_CONTENT: |
| case net::HTTP_RESET_CONTENT: |
| // These two status codes don't have an entity (or rather RFC 7231 |
| // requires that there be no entity). They are treated the same as the |
| // resource not being found since there is no entity to download. |
| |
| case net::HTTP_NOT_FOUND: |
| result = DOWNLOAD_INTERRUPT_REASON_SERVER_BAD_CONTENT; |
| break; |
| |
| case net::HTTP_REQUESTED_RANGE_NOT_SATISFIABLE: |
| // Retry by downloading from the start automatically: |
| // If we haven't received data when we get this error, we won't. |
| result = DOWNLOAD_INTERRUPT_REASON_SERVER_NO_RANGE; |
| break; |
| case net::HTTP_UNAUTHORIZED: |
| case net::HTTP_PROXY_AUTHENTICATION_REQUIRED: |
| // Server didn't authorize this request. |
| result = DOWNLOAD_INTERRUPT_REASON_SERVER_UNAUTHORIZED; |
| break; |
| case net::HTTP_FORBIDDEN: |
| // Server forbids access to this resource. |
| result = DOWNLOAD_INTERRUPT_REASON_SERVER_FORBIDDEN; |
| break; |
| default: // All other errors. |
| // Redirection and informational codes should have been handled earlier |
| // in the stack. |
| // TODO(xingliu): Handle HTTP_PRECONDITION_FAILED and resurrect |
| // DOWNLOAD_INTERRUPT_REASON_SERVER_PRECONDITION for range requests. |
| // This will change extensions::api::download::InterruptReason. |
| DCHECK_NE(3, http_headers.response_code() / 100); |
| DCHECK_NE(1, http_headers.response_code() / 100); |
| result = DOWNLOAD_INTERRUPT_REASON_SERVER_FAILED; |
| } |
| |
| if (result != DOWNLOAD_INTERRUPT_REASON_NONE && !fetch_error_body) |
| return result; |
| |
| // The caller is expecting a partial response. |
| if (save_info && (save_info->offset > 0 || save_info->length > 0)) { |
| if (http_headers.response_code() != net::HTTP_PARTIAL_CONTENT) { |
| // Server should send partial content when "If-Match" or |
| // "If-Unmodified-Since" check passes, and the range request header has |
| // last byte position. e.g. "Range:bytes=50-99". |
| if (save_info->length != DownloadSaveInfo::kLengthFullContent && |
| !fetch_error_body) |
| return DOWNLOAD_INTERRUPT_REASON_SERVER_BAD_CONTENT; |
| |
| // Requested a partial range, but received the entire response, when |
| // the range request header is "Range:bytes={offset}-". |
| // The response can be HTTP 200 or other error code when |
| // |fetch_error_body| is true. |
| save_info->offset = 0; |
| save_info->hash_of_partial_file.clear(); |
| save_info->hash_state.reset(); |
| return DOWNLOAD_INTERRUPT_REASON_NONE; |
| } |
| |
| int64_t first_byte = -1; |
| int64_t last_byte = -1; |
| int64_t length = -1; |
| if (!http_headers.GetContentRangeFor206(&first_byte, &last_byte, &length)) |
| return DOWNLOAD_INTERRUPT_REASON_SERVER_BAD_CONTENT; |
| DCHECK_GE(first_byte, 0); |
| |
| if (first_byte != save_info->offset || |
| (save_info->length > 0 && |
| last_byte != save_info->offset + save_info->length - 1)) { |
| // The server returned a different range than the one we requested. Assume |
| // the response is bad. |
| // |
| // In the future we should consider allowing offsets that are less than |
| // the offset we've requested, since in theory we can truncate the partial |
| // file at the offset and continue. |
| return DOWNLOAD_INTERRUPT_REASON_SERVER_BAD_CONTENT; |
| } |
| |
| return DOWNLOAD_INTERRUPT_REASON_NONE; |
| } |
| |
| if (http_headers.response_code() == net::HTTP_PARTIAL_CONTENT) |
| return DOWNLOAD_INTERRUPT_REASON_SERVER_BAD_CONTENT; |
| |
| return DOWNLOAD_INTERRUPT_REASON_NONE; |
| } |
| |
| void HandleResponseHeaders(const net::HttpResponseHeaders* headers, |
| DownloadCreateInfo* create_info) { |
| if (!headers) |
| return; |
| |
| if (headers->HasStrongValidators()) { |
| // If we don't have strong validators as per RFC 7232 section 2, then |
| // we neither store nor use them for range requests. |
| if (!headers->EnumerateHeader(nullptr, "Last-Modified", |
| &create_info->last_modified)) |
| create_info->last_modified.clear(); |
| if (!headers->EnumerateHeader(nullptr, "ETag", &create_info->etag)) |
| create_info->etag.clear(); |
| } |
| |
| // Grab the first content-disposition header. There may be more than one, |
| // though as of this writing, the network stack ensures if there are, they |
| // are all duplicates. |
| headers->EnumerateHeader(nullptr, "Content-Disposition", |
| &create_info->content_disposition); |
| |
| // Parse the original mime type from the header, notice that actual mime type |
| // might be different due to mime type sniffing. |
| if (!headers->GetMimeType(&create_info->original_mime_type)) |
| create_info->original_mime_type.clear(); |
| |
| // Content-Range is validated in HandleSuccessfulServerResponse. |
| // In RFC 7233, a single part 206 partial response must generate |
| // Content-Range. Accept-Range may be sent in 200 response to indicate the |
| // server can handle range request, but optional in 206 response. |
| create_info->accept_range = |
| headers->HasHeaderValue("Accept-Ranges", "bytes") || |
| (headers->HasHeader("Content-Range") && |
| headers->response_code() == net::HTTP_PARTIAL_CONTENT); |
| } |
| |
| download::DownloadSource ToDownloadSource( |
| content::DownloadSource download_source) { |
| switch (download_source) { |
| case DownloadSource::UNKNOWN: |
| return download::DownloadSource::UNKNOWN; |
| case DownloadSource::NAVIGATION: |
| return download::DownloadSource::NAVIGATION; |
| case DownloadSource::DRAG_AND_DROP: |
| return download::DownloadSource::DRAG_AND_DROP; |
| case DownloadSource::FROM_RENDERER: |
| return download::DownloadSource::FROM_RENDERER; |
| case DownloadSource::EXTENSION_API: |
| return download::DownloadSource::EXTENSION_API; |
| case DownloadSource::EXTENSION_INSTALLER: |
| return download::DownloadSource::EXTENSION_INSTALLER; |
| case DownloadSource::INTERNAL_API: |
| return download::DownloadSource::INTERNAL_API; |
| case DownloadSource::WEB_CONTENTS_API: |
| return download::DownloadSource::WEB_CONTENTS_API; |
| case DownloadSource::OFFLINE_PAGE: |
| return download::DownloadSource::OFFLINE_PAGE; |
| case DownloadSource::CONTEXT_MENU: |
| return download::DownloadSource::CONTEXT_MENU; |
| } |
| NOTREACHED(); |
| return download::DownloadSource::UNKNOWN; |
| } |
| |
| DownloadSource ToDownloadSource(download::DownloadSource download_source) { |
| switch (download_source) { |
| case download::DownloadSource::UNKNOWN: |
| return DownloadSource::UNKNOWN; |
| case download::DownloadSource::NAVIGATION: |
| return DownloadSource::NAVIGATION; |
| case download::DownloadSource::DRAG_AND_DROP: |
| return DownloadSource::DRAG_AND_DROP; |
| case download::DownloadSource::FROM_RENDERER: |
| return DownloadSource::FROM_RENDERER; |
| case download::DownloadSource::EXTENSION_API: |
| return DownloadSource::EXTENSION_API; |
| case download::DownloadSource::EXTENSION_INSTALLER: |
| return DownloadSource::EXTENSION_INSTALLER; |
| case download::DownloadSource::INTERNAL_API: |
| return DownloadSource::INTERNAL_API; |
| case download::DownloadSource::WEB_CONTENTS_API: |
| return DownloadSource::WEB_CONTENTS_API; |
| case download::DownloadSource::OFFLINE_PAGE: |
| return DownloadSource::OFFLINE_PAGE; |
| case download::DownloadSource::CONTEXT_MENU: |
| return DownloadSource::CONTEXT_MENU; |
| } |
| NOTREACHED(); |
| return DownloadSource::UNKNOWN; |
| } |
| |
| base::Optional<download::DownloadEntry> GetInProgressEntry( |
| const std::string& guid, |
| BrowserContext* browser_context) { |
| base::Optional<download::DownloadEntry> entry; |
| if (!browser_context || guid.empty()) |
| return entry; |
| |
| auto* manager_delegate = browser_context->GetDownloadManagerDelegate(); |
| if (manager_delegate) { |
| download::InProgressCache* in_progress_cache = |
| manager_delegate->GetInProgressCache(); |
| if (in_progress_cache) |
| entry = in_progress_cache->RetrieveEntry(guid); |
| } |
| return entry; |
| } |
| |
| } // namespace content |