blob: 6a02e007e3880544ae0320689dc111d2e522df5d [file] [log] [blame]
// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
[email protected]677c90572008-12-10 09:03:154
Lily Houghton582d4622018-01-22 22:43:405#include "net/proxy_resolution/pac_file_fetcher_impl.h"
[email protected]677c90572008-12-10 09:03:156
7#include "base/compiler_specific.h"
skyostil4891b25b2015-06-11 11:43:458#include "base/location.h"
[email protected]13a279e2009-04-13 17:32:379#include "base/logging.h"
asvitkine30330812016-08-30 04:01:0810#include "base/metrics/histogram_macros.h"
skyostil4891b25b2015-06-11 11:43:4511#include "base/single_thread_task_runner.h"
[email protected]fc9be5802013-06-11 10:56:5112#include "base/strings/string_util.h"
gabf767595f2016-05-11 18:50:3513#include "base/threading/thread_task_runner_handle.h"
[email protected]d9d71e082011-02-16 11:44:2814#include "net/base/data_url.h"
[email protected]9dea9e1f2009-01-29 00:30:4715#include "net/base/io_buffer.h"
[email protected]677c90572008-12-10 09:03:1516#include "net/base/load_flags.h"
[email protected]597cf6e2009-05-29 09:43:2617#include "net/base/net_errors.h"
[email protected]de362402014-05-10 18:32:4718#include "net/base/net_string_util.h"
[email protected]2ca01e52013-10-31 22:05:1919#include "net/base/request_priority.h"
[email protected]6e7845ae2013-03-29 21:48:1120#include "net/cert/cert_status_flags.h"
[email protected]e0ef2c22009-06-03 23:54:4421#include "net/http/http_response_headers.h"
[email protected]86933612010-10-16 23:10:3322#include "net/url_request/url_request_context.h"
[email protected]677c90572008-12-10 09:03:1523
// TODO(eroman):
//   - Support auth-prompts (http://crbug.com/77366)
[email protected]677c90572008-12-10 09:03:1526
27namespace net {
28
29namespace {
30
31// The maximum size (in bytes) allowed for a PAC script. Responses exceeding
32// this will fail with ERR_FILE_TOO_BIG.
[email protected]86933612010-10-16 23:10:3333const int kDefaultMaxResponseBytes = 1048576; // 1 megabyte
[email protected]677c90572008-12-10 09:03:1534
35// The maximum duration (in milliseconds) allowed for fetching the PAC script.
36// Responses exceeding this will fail with ERR_TIMED_OUT.
Eric Romancdb1d1c2018-01-03 21:17:0837//
38// This timeout applies to both scripts fetched in the course of WPAD, as well
39// as explicitly configured ones.
40//
41// If the default timeout is too high, auto-detect can stall for a long time,
42// and if it is too low then slow loading scripts may be skipped.
43//
44// 30 seconds is a compromise between those competing goals. This value also
45// appears to match Microsoft Edge (based on testing).
46constexpr base::TimeDelta kDefaultMaxDuration =
47 base::TimeDelta::FromSeconds(30);
[email protected]677c90572008-12-10 09:03:1548
[email protected]13a279e2009-04-13 17:32:3749// Returns true if |mime_type| is one of the known PAC mime type.
50bool IsPacMimeType(const std::string& mime_type) {
Lily Houghton9844d322018-01-20 05:44:0151 static const char* const kSupportedPacMimeTypes[] = {
52 "application/x-ns-proxy-autoconfig", "application/x-javascript-config",
[email protected]13a279e2009-04-13 17:32:3753 };
54 for (size_t i = 0; i < arraysize(kSupportedPacMimeTypes); ++i) {
brettwbc17d2c82015-06-09 22:39:0855 if (base::LowerCaseEqualsASCII(mime_type, kSupportedPacMimeTypes[i]))
[email protected]13a279e2009-04-13 17:32:3756 return true;
57 }
58 return false;
59}
60
[email protected]9b9ae9552010-07-01 22:20:5061// Converts |bytes| (which is encoded by |charset|) to UTF16, saving the resul
62// to |*utf16|.
[email protected]8f3c96342009-09-22 03:06:5463// If |charset| is empty, then we don't know what it was and guess.
[email protected]9b9ae9552010-07-01 22:20:5064void ConvertResponseToUTF16(const std::string& charset,
65 const std::string& bytes,
[email protected]42cba2fb2013-03-29 19:58:5766 base::string16* utf16) {
[email protected]8f3c96342009-09-22 03:06:5467 const char* codepage;
68
69 if (charset.empty()) {
70 // Assume ISO-8859-1 if no charset was specified.
[email protected]de362402014-05-10 18:32:4771 codepage = kCharsetLatin1;
[email protected]8f3c96342009-09-22 03:06:5472 } else {
73 // Otherwise trust the charset that was provided.
74 codepage = charset.c_str();
75 }
76
[email protected]de362402014-05-10 18:32:4777 // Be generous in the conversion -- if any characters lie outside of |charset|
78 // (i.e. invalid), then substitute them with U+FFFD rather than failing.
79 ConvertToUTF16WithSubstitutions(bytes, codepage, utf16);
[email protected]8f3c96342009-09-22 03:06:5480}
81
[email protected]677c90572008-12-10 09:03:1582} // namespace
83
Lily Houghton99597862018-03-07 16:40:4284PacFileFetcherImpl::PacFileFetcherImpl(URLRequestContext* url_request_context)
kulkarni.acd7b4462014-08-28 07:41:3485 : url_request_context_(url_request_context),
[email protected]da968bc2011-01-19 11:48:1986 buf_(new IOBuffer(kBufSize)),
[email protected]677c90572008-12-10 09:03:1587 next_id_(0),
[email protected]677c90572008-12-10 09:03:1588 cur_request_id_(0),
[email protected]677c90572008-12-10 09:03:1589 result_code_(OK),
[email protected]86933612010-10-16 23:10:3390 result_text_(NULL),
91 max_response_bytes_(kDefaultMaxResponseBytes),
Eric Romancdb1d1c2018-01-03 21:17:0892 max_duration_(kDefaultMaxDuration),
kulkarni.acd7b4462014-08-28 07:41:3493 weak_factory_(this) {
[email protected]677c90572008-12-10 09:03:1594 DCHECK(url_request_context);
95}
96
Lily Houghton99597862018-03-07 16:40:4297PacFileFetcherImpl::~PacFileFetcherImpl() {
[email protected]da968bc2011-01-19 11:48:1998 // The URLRequest's destructor will cancel the outstanding request, and
[email protected]677c90572008-12-10 09:03:1599 // ensure that the delegate (this) is not called again.
100}
101
Lily Houghton99597862018-03-07 16:40:42102base::TimeDelta PacFileFetcherImpl::SetTimeoutConstraint(
[email protected]7aefb152011-01-21 23:46:49103 base::TimeDelta timeout) {
104 base::TimeDelta prev = max_duration_;
105 max_duration_ = timeout;
106 return prev;
107}
108
Lily Houghton99597862018-03-07 16:40:42109size_t PacFileFetcherImpl::SetSizeConstraint(size_t size_bytes) {
[email protected]7aefb152011-01-21 23:46:49110 size_t prev = max_response_bytes_;
111 max_response_bytes_ = size_bytes;
112 return prev;
113}
114
Lily Houghton99597862018-03-07 16:40:42115void PacFileFetcherImpl::OnResponseCompleted(URLRequest* request,
116 int net_error) {
[email protected]7aefb152011-01-21 23:46:49117 DCHECK_EQ(request, cur_request_.get());
118
119 // Use |result_code_| as the request's error if we have already set it to
120 // something specific.
maksim.sisovbf794e22016-09-13 09:20:34121 if (result_code_ == OK && net_error != OK)
122 result_code_ = net_error;
[email protected]7aefb152011-01-21 23:46:49123
124 FetchCompleted();
125}
126
Ramin Halavatibb8c4d82018-03-16 08:04:31127int PacFileFetcherImpl::Fetch(
128 const GURL& url,
129 base::string16* text,
130 const CompletionCallback& callback,
131 const NetworkTrafficAnnotationTag traffic_annotation) {
[email protected]677c90572008-12-10 09:03:15132 // It is invalid to call Fetch() while a request is already in progress.
133 DCHECK(!cur_request_.get());
[email protected]235786812011-12-20 02:15:31134 DCHECK(!callback.is_null());
[email protected]9b9ae9552010-07-01 22:20:50135 DCHECK(text);
[email protected]677c90572008-12-10 09:03:15136
mmenkeed8d7e432017-05-03 16:48:33137 if (!url_request_context_)
138 return ERR_CONTEXT_SHUT_DOWN;
139
[email protected]d9d71e082011-02-16 11:44:28140 // Handle base-64 encoded data-urls that contain custom PAC scripts.
141 if (url.SchemeIs("data")) {
142 std::string mime_type;
143 std::string charset;
144 std::string data;
145 if (!DataURL::Parse(url, &mime_type, &charset, &data))
146 return ERR_FAILED;
147
148 ConvertResponseToUTF16(charset, data, text);
149 return OK;
150 }
151
cbentzel27d2e5e52015-07-10 17:39:56152 DCHECK(fetch_start_time_.is_null());
cbentzele45ccba2015-08-21 18:23:14153 fetch_start_time_ = base::TimeTicks::Now();
cbentzel27d2e5e52015-07-10 17:39:56154
mmenkeed8d7e432017-05-03 16:48:33155 // Use highest priority, so if socket pools are being used for other types of
156 // requests, PAC requests are aren't blocked on them.
rhalavatide8bf4e2017-05-16 06:09:11157 cur_request_ = url_request_context_->CreateRequest(url, MAXIMUM_PRIORITY,
158 this, traffic_annotation);
Matt Menke510ceaa12018-01-09 17:52:26159 cur_request_->set_is_pac_request(true);
[email protected]677c90572008-12-10 09:03:15160
161 // Make sure that the PAC script is downloaded using a direct connection,
162 // to avoid circular dependencies (fetching is a part of proxy resolution).
[email protected]e0ef2c22009-06-03 23:54:44163 // Also disable the use of the disk cache. The cache is disabled so that if
164 // the user switches networks we don't potentially use the cached response
165 // from old network when we should in fact be re-fetching on the new network.
[email protected]6fbac162011-06-20 00:29:04166 // If the PAC script is hosted on an HTTPS server we bypass revocation
167 // checking in order to avoid a circular dependency when attempting to fetch
168 // the OCSP response or CRL. We could make the revocation check go direct but
mmenkeed8d7e432017-05-03 16:48:33169 // the proxy might be the only way to the outside world. IGNORE_LIMITS is
170 // used to avoid blocking proxy resolution on other network requests.
[email protected]bb1c4662013-11-14 00:00:07171 cur_request_->SetLoadFlags(LOAD_BYPASS_PROXY | LOAD_DISABLE_CACHE |
mmenkeed8d7e432017-05-03 16:48:33172 LOAD_DISABLE_CERT_REVOCATION_CHECKING |
173 LOAD_IGNORE_LIMITS);
[email protected]677c90572008-12-10 09:03:15174
175 // Save the caller's info for notification on completion.
176 callback_ = callback;
[email protected]9b9ae9552010-07-01 22:20:50177 result_text_ = text;
178
179 bytes_read_so_far_.clear();
[email protected]677c90572008-12-10 09:03:15180
181 // Post a task to timeout this request if it takes too long.
182 cur_request_id_ = ++next_id_;
eromane1867242015-04-23 23:07:44183
skyostil4891b25b2015-06-11 11:43:45184 base::ThreadTaskRunnerHandle::Get()->PostDelayedTask(
Lily Houghton9844d322018-01-20 05:44:01185 FROM_HERE,
Lily Houghton99597862018-03-07 16:40:42186 base::Bind(&PacFileFetcherImpl::OnTimeout, weak_factory_.GetWeakPtr(),
Lily Houghton9844d322018-01-20 05:44:01187 cur_request_id_),
[email protected]26b9973962012-01-28 00:57:00188 max_duration_);
[email protected]677c90572008-12-10 09:03:15189
190 // Start the request.
191 cur_request_->Start();
[email protected]620f5712009-08-04 22:43:12192 return ERR_IO_PENDING;
[email protected]677c90572008-12-10 09:03:15193}
194
Lily Houghton99597862018-03-07 16:40:42195void PacFileFetcherImpl::Cancel() {
[email protected]da968bc2011-01-19 11:48:19196 // ResetCurRequestState will free the URLRequest, which will cause
[email protected]677c90572008-12-10 09:03:15197 // cancellation.
198 ResetCurRequestState();
199}
200
Lily Houghton99597862018-03-07 16:40:42201URLRequestContext* PacFileFetcherImpl::GetRequestContext() const {
[email protected]20d296ddc2009-11-18 23:07:08202 return url_request_context_;
203}
204
Lily Houghton99597862018-03-07 16:40:42205void PacFileFetcherImpl::OnShutdown() {
mmenkeed8d7e432017-05-03 16:48:33206 url_request_context_ = nullptr;
207
208 if (cur_request_) {
209 result_code_ = ERR_CONTEXT_SHUT_DOWN;
210 FetchCompleted();
211 }
212}
213
Lily Houghton99597862018-03-07 16:40:42214void PacFileFetcherImpl::OnAuthRequired(URLRequest* request,
215 AuthChallengeInfo* auth_info) {
[email protected]0967249162010-11-20 00:13:32216 DCHECK_EQ(request, cur_request_.get());
[email protected]33abb682011-03-29 03:58:42217 // TODO(eroman): http://crbug.com/77366
[email protected]13a279e2009-04-13 17:32:37218 LOG(WARNING) << "Auth required to fetch PAC script, aborting.";
[email protected]677c90572008-12-10 09:03:15219 result_code_ = ERR_NOT_IMPLEMENTED;
220 request->CancelAuth();
221}
222
Lily Houghton99597862018-03-07 16:40:42223void PacFileFetcherImpl::OnSSLCertificateError(URLRequest* request,
224 const SSLInfo& ssl_info,
225 bool fatal) {
[email protected]0967249162010-11-20 00:13:32226 DCHECK_EQ(request, cur_request_.get());
[email protected]5db5a73d2011-10-12 16:19:36227 // Revocation check failures are not fatal.
228 if (IsCertStatusMinorError(ssl_info.cert_status)) {
229 request->ContinueDespiteLastError();
230 return;
231 }
[email protected]13a279e2009-04-13 17:32:37232 LOG(WARNING) << "SSL certificate error when fetching PAC script, aborting.";
[email protected]677c90572008-12-10 09:03:15233 // Certificate errors are in same space as net errors.
[email protected]e5624f02011-09-27 19:43:53234 result_code_ = MapCertStatusToNetError(ssl_info.cert_status);
[email protected]677c90572008-12-10 09:03:15235 request->Cancel();
236}
237
Lily Houghton99597862018-03-07 16:40:42238void PacFileFetcherImpl::OnResponseStarted(URLRequest* request, int net_error) {
[email protected]0967249162010-11-20 00:13:32239 DCHECK_EQ(request, cur_request_.get());
maksim.sisovbf794e22016-09-13 09:20:34240 DCHECK_NE(ERR_IO_PENDING, net_error);
[email protected]677c90572008-12-10 09:03:15241
maksim.sisovbf794e22016-09-13 09:20:34242 if (net_error != OK) {
243 OnResponseCompleted(request, net_error);
[email protected]677c90572008-12-10 09:03:15244 return;
245 }
246
247 // Require HTTP responses to have a success status code.
[email protected]91f5689032013-08-22 01:43:33248 if (request->url().SchemeIsHTTPOrHTTPS()) {
[email protected]f0a51fb52009-03-05 12:46:38249 // NOTE about status codes: We are like Firefox 3 in this respect.
[email protected]677c90572008-12-10 09:03:15250 // {IE 7, Safari 3, Opera 9.5} do not care about the status code.
251 if (request->GetResponseCode() != 200) {
[email protected]b30a3f52010-10-16 01:05:46252 VLOG(1) << "Fetched PAC script had (bad) status line: "
253 << request->response_headers()->GetStatusLine();
[email protected]677c90572008-12-10 09:03:15254 result_code_ = ERR_PAC_STATUS_NOT_OK;
255 request->Cancel();
256 return;
257 }
[email protected]13a279e2009-04-13 17:32:37258
259 // NOTE about mime types: We do not enforce mime types on PAC files.
260 // This is for compatibility with {IE 7, Firefox 3, Opera 9.5}. We will
261 // however log mismatches to help with debugging.
[email protected]e0ef2c22009-06-03 23:54:44262 std::string mime_type;
263 cur_request_->GetMimeType(&mime_type);
264 if (!IsPacMimeType(mime_type)) {
[email protected]b30a3f52010-10-16 01:05:46265 VLOG(1) << "Fetched PAC script does not have a proper mime type: "
266 << mime_type;
[email protected]13a279e2009-04-13 17:32:37267 }
[email protected]677c90572008-12-10 09:03:15268 }
269
270 ReadBody(request);
271}
272
Lily Houghton99597862018-03-07 16:40:42273void PacFileFetcherImpl::OnReadCompleted(URLRequest* request, int num_bytes) {
maksim.sisovbf794e22016-09-13 09:20:34274 DCHECK_NE(ERR_IO_PENDING, num_bytes);
275
[email protected]0967249162010-11-20 00:13:32276 DCHECK_EQ(request, cur_request_.get());
277 if (ConsumeBytesRead(request, num_bytes)) {
278 // Keep reading.
[email protected]677c90572008-12-10 09:03:15279 ReadBody(request);
[email protected]677c90572008-12-10 09:03:15280 }
281}
282
Lily Houghton99597862018-03-07 16:40:42283void PacFileFetcherImpl::ReadBody(URLRequest* request) {
[email protected]0967249162010-11-20 00:13:32284 // Read as many bytes as are available synchronously.
285 while (true) {
maksim.sisovbf794e22016-09-13 09:20:34286 int num_bytes = request->Read(buf_.get(), kBufSize);
287 if (num_bytes == ERR_IO_PENDING)
288 return;
289
290 if (num_bytes < 0) {
291 OnResponseCompleted(request, num_bytes);
[email protected]0967249162010-11-20 00:13:32292 return;
293 }
maksim.sisovbf794e22016-09-13 09:20:34294
[email protected]0967249162010-11-20 00:13:32295 if (!ConsumeBytesRead(request, num_bytes))
296 return;
[email protected]677c90572008-12-10 09:03:15297 }
298}
299
Lily Houghton99597862018-03-07 16:40:42300bool PacFileFetcherImpl::ConsumeBytesRead(URLRequest* request, int num_bytes) {
Eric Romanf4174852018-02-16 22:47:13301 if (fetch_time_to_first_byte_.is_null())
302 fetch_time_to_first_byte_ = base::TimeTicks::Now();
303
[email protected]0967249162010-11-20 00:13:32304 if (num_bytes <= 0) {
305 // Error while reading, or EOF.
maksim.sisovbf794e22016-09-13 09:20:34306 OnResponseCompleted(request, num_bytes);
[email protected]0967249162010-11-20 00:13:32307 return false;
308 }
309
310 // Enforce maximum size bound.
311 if (num_bytes + bytes_read_so_far_.size() >
312 static_cast<size_t>(max_response_bytes_)) {
313 result_code_ = ERR_FILE_TOO_BIG;
314 request->Cancel();
315 return false;
316 }
317
[email protected]0967249162010-11-20 00:13:32318 bytes_read_so_far_.append(buf_->data(), num_bytes);
319 return true;
320}
321
Lily Houghton99597862018-03-07 16:40:42322void PacFileFetcherImpl::FetchCompleted() {
[email protected]8f3c96342009-09-22 03:06:54323 if (result_code_ == OK) {
Lily Houghton99597862018-03-07 16:40:42324 // Calculate duration of time for PAC file fetch to complete.
cbentzel27d2e5e52015-07-10 17:39:56325 DCHECK(!fetch_start_time_.is_null());
cbentzele45ccba2015-08-21 18:23:14326 DCHECK(!fetch_time_to_first_byte_.is_null());
327 UMA_HISTOGRAM_MEDIUM_TIMES("Net.ProxyScriptFetcher.SuccessDuration",
328 base::TimeTicks::Now() - fetch_start_time_);
329 UMA_HISTOGRAM_MEDIUM_TIMES("Net.ProxyScriptFetcher.FirstByteDuration",
330 fetch_time_to_first_byte_ - fetch_start_time_);
cbentzel27d2e5e52015-07-10 17:39:56331
[email protected]9b9ae9552010-07-01 22:20:50332 // The caller expects the response to be encoded as UTF16.
[email protected]8f3c96342009-09-22 03:06:54333 std::string charset;
334 cur_request_->GetCharset(&charset);
[email protected]9b9ae9552010-07-01 22:20:50335 ConvertResponseToUTF16(charset, bytes_read_so_far_, result_text_);
[email protected]8f3c96342009-09-22 03:06:54336 } else {
337 // On error, the caller expects empty string for bytes.
[email protected]9b9ae9552010-07-01 22:20:50338 result_text_->clear();
[email protected]8f3c96342009-09-22 03:06:54339 }
[email protected]677c90572008-12-10 09:03:15340
341 int result_code = result_code_;
[email protected]235786812011-12-20 02:15:31342 CompletionCallback callback = callback_;
[email protected]677c90572008-12-10 09:03:15343
344 ResetCurRequestState();
345
[email protected]235786812011-12-20 02:15:31346 callback.Run(result_code);
[email protected]677c90572008-12-10 09:03:15347}
348
Lily Houghton99597862018-03-07 16:40:42349void PacFileFetcherImpl::ResetCurRequestState() {
[email protected]677c90572008-12-10 09:03:15350 cur_request_.reset();
351 cur_request_id_ = 0;
[email protected]235786812011-12-20 02:15:31352 callback_.Reset();
[email protected]677c90572008-12-10 09:03:15353 result_code_ = OK;
[email protected]9b9ae9552010-07-01 22:20:50354 result_text_ = NULL;
cbentzele45ccba2015-08-21 18:23:14355 fetch_start_time_ = base::TimeTicks();
356 fetch_time_to_first_byte_ = base::TimeTicks();
[email protected]677c90572008-12-10 09:03:15357}
358
Lily Houghton99597862018-03-07 16:40:42359void PacFileFetcherImpl::OnTimeout(int id) {
[email protected]da968bc2011-01-19 11:48:19360 // Timeout tasks may outlive the URLRequest they reference. Make sure it
[email protected]677c90572008-12-10 09:03:15361 // is still applicable.
362 if (cur_request_id_ != id)
363 return;
364
365 DCHECK(cur_request_.get());
366 result_code_ = ERR_TIMED_OUT;
mmenkeed8d7e432017-05-03 16:48:33367 FetchCompleted();
[email protected]677c90572008-12-10 09:03:15368}
369
[email protected]677c90572008-12-10 09:03:15370} // namespace net