blob: 460b980c5bd87521e13c10f151d7b8a5ebf42dd0 [file] [log] [blame]
rspangler@google.com49fdf182009-10-10 00:57:34 +00001// Copyright (c) 2009 The Chromium OS Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
rspangler@google.com49fdf182009-10-10 00:57:34 +00005#include "update_engine/libcurl_http_fetcher.h"
Andrew de los Reyesd57d1472010-10-21 13:34:08 -07006
adlr@google.comc98a7ed2009-12-04 18:54:03 +00007#include <algorithm>
Andrew de los Reyesd57d1472010-10-21 13:34:08 -07008#include <string>
9
10#include <base/logging.h>
11
12#include "update_engine/dbus_interface.h"
13#include "update_engine/flimflam_proxy.h"
14#include "update_engine/utils.h"
adlr@google.comc98a7ed2009-12-04 18:54:03 +000015
16using std::max;
17using std::make_pair;
Andrew de los Reyesd57d1472010-10-21 13:34:08 -070018using std::string;
rspangler@google.com49fdf182009-10-10 00:57:34 +000019
20// This is a concrete implementation of HttpFetcher that uses libcurl to do the
21// http work.
22
23namespace chromeos_update_engine {
24
namespace {
// Maximum number of times an incomplete transfer is restarted; once
// |retry_count_| exceeds this value the delegate is told the transfer failed.
const int kMaxRetriesCount = 20;
// Directory handed to libcurl via CURLOPT_CAPATH in official builds, i.e. the
// only location from which CA certificates are trusted in that configuration.
const char kCACertificatesPath[] = "/usr/share/chromeos-ca-certificates";
}  // namespace
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -070029
rspangler@google.com49fdf182009-10-10 00:57:34 +000030LibcurlHttpFetcher::~LibcurlHttpFetcher() {
Darin Petkov9ce452b2010-11-17 14:33:28 -080031 LOG_IF(ERROR, transfer_in_progress_)
32 << "Destroying the fetcher while a transfer is in progress.";
rspangler@google.com49fdf182009-10-10 00:57:34 +000033 CleanUp();
34}
35
Andrew de los Reyesd57d1472010-10-21 13:34:08 -070036// On error, returns false.
37bool LibcurlHttpFetcher::ConnectionIsExpensive() const {
38 if (force_connection_type_)
39 return forced_expensive_connection_;
40 NetworkConnectionType type;
41 ConcreteDbusGlib dbus_iface;
42 TEST_AND_RETURN_FALSE(FlimFlamProxy::GetConnectionType(&dbus_iface, &type));
43 LOG(INFO) << "We are connected via "
44 << FlimFlamProxy::StringForConnectionType(type);
45 return FlimFlamProxy::IsExpensiveConnectionType(type);
46}
47
Darin Petkovfc7a0ce2010-10-25 10:38:37 -070048bool LibcurlHttpFetcher::IsOfficialBuild() const {
49 return force_build_type_ ? forced_official_build_ : utils::IsOfficialBuild();
50}
51
adlr@google.comc98a7ed2009-12-04 18:54:03 +000052void LibcurlHttpFetcher::ResumeTransfer(const std::string& url) {
Andrew de los Reyes3270f742010-07-15 22:28:14 -070053 LOG(INFO) << "Starting/Resuming transfer";
rspangler@google.com49fdf182009-10-10 00:57:34 +000054 CHECK(!transfer_in_progress_);
55 url_ = url;
56 curl_multi_handle_ = curl_multi_init();
57 CHECK(curl_multi_handle_);
58
59 curl_handle_ = curl_easy_init();
60 CHECK(curl_handle_);
61
62 if (post_data_set_) {
adlr@google.comc98a7ed2009-12-04 18:54:03 +000063 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_POST, 1), CURLE_OK);
64 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_POSTFIELDS,
65 &post_data_[0]),
66 CURLE_OK);
67 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_POSTFIELDSIZE,
68 post_data_.size()),
69 CURLE_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +000070 }
71
adlr@google.comc98a7ed2009-12-04 18:54:03 +000072 if (bytes_downloaded_ > 0) {
73 // Resume from where we left off
74 resume_offset_ = bytes_downloaded_;
75 CHECK_EQ(curl_easy_setopt(curl_handle_,
76 CURLOPT_RESUME_FROM_LARGE,
77 bytes_downloaded_), CURLE_OK);
78 }
79
80 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_WRITEDATA, this), CURLE_OK);
81 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_WRITEFUNCTION,
82 StaticLibcurlWrite), CURLE_OK);
Andrew de los Reyesd57d1472010-10-21 13:34:08 -070083
84 string url_to_use(url_);
85 if (ConnectionIsExpensive()) {
86 LOG(INFO) << "Not initiating HTTP connection b/c we are on an expensive"
87 << " connection";
88 url_to_use = ""; // Sabotage the URL
89 }
90
Darin Petkovfc7a0ce2010-10-25 10:38:37 -070091 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_URL, url_to_use.c_str()),
Andrew de los Reyesd57d1472010-10-21 13:34:08 -070092 CURLE_OK);
Andrew de los Reyes3270f742010-07-15 22:28:14 -070093
Darin Petkov192ced42010-07-23 16:20:24 -070094 // If the connection drops under 10 bytes/sec for 3 minutes, reconnect.
Andrew de los Reyes3270f742010-07-15 22:28:14 -070095 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_LOW_SPEED_LIMIT, 10),
96 CURLE_OK);
Darin Petkov192ced42010-07-23 16:20:24 -070097 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_LOW_SPEED_TIME, 3 * 60),
Andrew de los Reyes3270f742010-07-15 22:28:14 -070098 CURLE_OK);
99
Darin Petkov41c2fcf2010-08-25 13:14:48 -0700100 // By default, libcurl doesn't follow redirections. Allow up to
101 // |kMaxRedirects| redirections.
Darin Petkov3a4016a2010-09-28 13:54:17 -0700102 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_FOLLOWLOCATION, 1), CURLE_OK);
Darin Petkov41c2fcf2010-08-25 13:14:48 -0700103 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_MAXREDIRS, kMaxRedirects),
104 CURLE_OK);
105
Darin Petkove237d192010-11-16 10:26:08 -0800106 // Security lock-down in official builds: makes sure that peer certificate
107 // verification is enabled, restricts the set of trusted certificates,
108 // restricts protocols to HTTPS, restricts ciphers to HIGH.
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700109 if (IsOfficialBuild()) {
Darin Petkove237d192010-11-16 10:26:08 -0800110 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_SSL_VERIFYPEER, 1),
111 CURLE_OK);
112 CHECK_EQ(curl_easy_setopt(curl_handle_,
113 CURLOPT_CAPATH,
114 kCACertificatesPath),
115 CURLE_OK);
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700116 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_PROTOCOLS, CURLPROTO_HTTPS),
117 CURLE_OK);
118 CHECK_EQ(curl_easy_setopt(curl_handle_,
119 CURLOPT_REDIR_PROTOCOLS,
120 CURLPROTO_HTTPS),
121 CURLE_OK);
Darin Petkove237d192010-11-16 10:26:08 -0800122 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_SSL_CIPHER_LIST, "HIGH"),
123 CURLE_OK);
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700124 }
125
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000126 CHECK_EQ(curl_multi_add_handle(curl_multi_handle_, curl_handle_), CURLM_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000127 transfer_in_progress_ = true;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000128}
129
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000130// Begins the transfer, which must not have already been started.
131void LibcurlHttpFetcher::BeginTransfer(const std::string& url) {
132 transfer_size_ = -1;
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000133 resume_offset_ = 0;
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700134 retry_count_ = 0;
Darin Petkovcb466212010-08-26 09:40:11 -0700135 http_response_code_ = 0;
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700136 ResumeTransfer(url);
137 CurlPerformOnce();
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000138}
139
Darin Petkov9ce452b2010-11-17 14:33:28 -0800140void LibcurlHttpFetcher::ForceTransferTermination() {
141 CleanUp();
142 if (delegate_) {
143 // Note that after the callback returns this object may be destroyed.
144 delegate_->TransferTerminated(this);
145 }
146}
147
rspangler@google.com49fdf182009-10-10 00:57:34 +0000148void LibcurlHttpFetcher::TerminateTransfer() {
Darin Petkov9ce452b2010-11-17 14:33:28 -0800149 if (in_write_callback_) {
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700150 terminate_requested_ = true;
Darin Petkov9ce452b2010-11-17 14:33:28 -0800151 } else {
152 ForceTransferTermination();
153 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000154}
155
Andrew de los Reyescb319332010-07-19 10:55:01 -0700156void LibcurlHttpFetcher::CurlPerformOnce() {
rspangler@google.com49fdf182009-10-10 00:57:34 +0000157 CHECK(transfer_in_progress_);
158 int running_handles = 0;
159 CURLMcode retcode = CURLM_CALL_MULTI_PERFORM;
160
161 // libcurl may request that we immediately call curl_multi_perform after it
162 // returns, so we do. libcurl promises that curl_multi_perform will not block.
163 while (CURLM_CALL_MULTI_PERFORM == retcode) {
164 retcode = curl_multi_perform(curl_multi_handle_, &running_handles);
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700165 if (terminate_requested_) {
Darin Petkov9ce452b2010-11-17 14:33:28 -0800166 ForceTransferTermination();
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700167 return;
168 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000169 }
170 if (0 == running_handles) {
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700171 GetHttpResponseCode();
172 if (http_response_code_) {
173 LOG(INFO) << "HTTP response code: " << http_response_code_;
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700174 } else {
175 LOG(ERROR) << "Unable to get http response code.";
176 }
Darin Petkov192ced42010-07-23 16:20:24 -0700177
rspangler@google.com49fdf182009-10-10 00:57:34 +0000178 // we're done!
179 CleanUp();
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000180
181 if ((transfer_size_ >= 0) && (bytes_downloaded_ < transfer_size_)) {
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700182 // Need to restart transfer
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700183 retry_count_++;
184 LOG(INFO) << "Restarting transfer b/c we finished, had downloaded "
185 << bytes_downloaded_ << " bytes, but transfer_size_ is "
186 << transfer_size_ << ". retry_count: " << retry_count_;
187 if (retry_count_ > kMaxRetriesCount) {
188 if (delegate_)
189 delegate_->TransferComplete(this, false); // success
190 } else {
Darin Petkovb83371f2010-08-17 09:34:49 -0700191 g_timeout_add_seconds(retry_seconds_,
Darin Petkov9b111652010-08-16 11:46:25 -0700192 &LibcurlHttpFetcher::StaticRetryTimeoutCallback,
193 this);
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700194 }
Andrew de los Reyescb319332010-07-19 10:55:01 -0700195 return;
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000196 } else {
197 if (delegate_) {
Andrew de los Reyesfb4ad7d2010-07-19 10:43:46 -0700198 // success is when http_response_code is 2xx
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700199 bool success = (http_response_code_ >= 200) &&
200 (http_response_code_ < 300);
Andrew de los Reyesfb4ad7d2010-07-19 10:43:46 -0700201 delegate_->TransferComplete(this, success);
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000202 }
203 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000204 } else {
205 // set up callback
206 SetupMainloopSources();
207 }
208}
209
210size_t LibcurlHttpFetcher::LibcurlWrite(void *ptr, size_t size, size_t nmemb) {
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700211 GetHttpResponseCode();
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000212 {
213 double transfer_size_double;
214 CHECK_EQ(curl_easy_getinfo(curl_handle_,
215 CURLINFO_CONTENT_LENGTH_DOWNLOAD,
216 &transfer_size_double), CURLE_OK);
217 off_t new_transfer_size = static_cast<off_t>(transfer_size_double);
218 if (new_transfer_size > 0) {
219 transfer_size_ = resume_offset_ + new_transfer_size;
220 }
221 }
222 bytes_downloaded_ += size * nmemb;
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700223 in_write_callback_ = true;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000224 if (delegate_)
225 delegate_->ReceivedBytes(this, reinterpret_cast<char*>(ptr), size * nmemb);
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700226 in_write_callback_ = false;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000227 return size * nmemb;
228}
229
230void LibcurlHttpFetcher::Pause() {
231 CHECK(curl_handle_);
232 CHECK(transfer_in_progress_);
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000233 CHECK_EQ(curl_easy_pause(curl_handle_, CURLPAUSE_ALL), CURLE_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000234}
235
236void LibcurlHttpFetcher::Unpause() {
237 CHECK(curl_handle_);
238 CHECK(transfer_in_progress_);
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000239 CHECK_EQ(curl_easy_pause(curl_handle_, CURLPAUSE_CONT), CURLE_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000240}
241
242// This method sets up callbacks with the glib main loop.
243void LibcurlHttpFetcher::SetupMainloopSources() {
244 fd_set fd_read;
245 fd_set fd_write;
Darin Petkov60e14152010-10-27 16:57:04 -0700246 fd_set fd_exc;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000247
248 FD_ZERO(&fd_read);
249 FD_ZERO(&fd_write);
Darin Petkov60e14152010-10-27 16:57:04 -0700250 FD_ZERO(&fd_exc);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000251
252 int fd_max = 0;
253
254 // Ask libcurl for the set of file descriptors we should track on its
255 // behalf.
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000256 CHECK_EQ(curl_multi_fdset(curl_multi_handle_, &fd_read, &fd_write,
Darin Petkov60e14152010-10-27 16:57:04 -0700257 &fd_exc, &fd_max), CURLM_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000258
259 // We should iterate through all file descriptors up to libcurl's fd_max or
Darin Petkov60e14152010-10-27 16:57:04 -0700260 // the highest one we're tracking, whichever is larger.
261 for (size_t t = 0; t < arraysize(io_channels_); ++t) {
262 if (!io_channels_[t].empty())
263 fd_max = max(fd_max, io_channels_[t].rbegin()->first);
264 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000265
Darin Petkov60e14152010-10-27 16:57:04 -0700266 // For each fd, if we're not tracking it, track it. If we are tracking it, but
267 // libcurl doesn't care about it anymore, stop tracking it. After this loop,
268 // there should be exactly as many GIOChannel objects in io_channels_[0|1] as
269 // there are read/write fds that we're tracking.
270 for (int fd = 0; fd <= fd_max; ++fd) {
271 // Note that fd_exc is unused in the current version of libcurl so is_exc
272 // should always be false.
273 bool is_exc = FD_ISSET(fd, &fd_exc) != 0;
274 bool must_track[2] = {
275 is_exc || (FD_ISSET(fd, &fd_read) != 0), // track 0 -- read
276 is_exc || (FD_ISSET(fd, &fd_write) != 0) // track 1 -- write
277 };
278
279 for (size_t t = 0; t < arraysize(io_channels_); ++t) {
280 bool tracked = io_channels_[t].find(fd) != io_channels_[t].end();
281
282 if (!must_track[t]) {
283 // If we have an outstanding io_channel, remove it.
284 if (tracked) {
285 g_source_remove(io_channels_[t][fd].second);
286 g_io_channel_unref(io_channels_[t][fd].first);
287 io_channels_[t].erase(io_channels_[t].find(fd));
288 }
289 continue;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000290 }
Darin Petkov60e14152010-10-27 16:57:04 -0700291
292 // If we are already tracking this fd, continue -- nothing to do.
293 if (tracked)
294 continue;
295
296 // Set conditions appropriately -- read for track 0, write for track 1.
297 GIOCondition condition = static_cast<GIOCondition>(
298 ((t == 0) ? (G_IO_IN | G_IO_PRI) : G_IO_OUT) | G_IO_ERR | G_IO_HUP);
299
300 // Track a new fd.
301 GIOChannel* io_channel = g_io_channel_unix_new(fd);
302 guint tag =
303 g_io_add_watch(io_channel, condition, &StaticFDCallback, this);
304
305 io_channels_[t][fd] = make_pair(io_channel, tag);
306 static int io_counter = 0;
307 io_counter++;
308 if (io_counter % 50 == 0) {
309 LOG(INFO) << "io_counter = " << io_counter;
310 }
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700311 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000312 }
313
Darin Petkovb83371f2010-08-17 09:34:49 -0700314 // Set up a timeout callback for libcurl.
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700315 if (!timeout_source_) {
Darin Petkovb83371f2010-08-17 09:34:49 -0700316 LOG(INFO) << "Setting up timeout source: " << idle_seconds_ << " seconds.";
317 timeout_source_ = g_timeout_source_new_seconds(idle_seconds_);
318 g_source_set_callback(timeout_source_, StaticTimeoutCallback, this, NULL);
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700319 g_source_attach(timeout_source_, NULL);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000320 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000321}
322
323bool LibcurlHttpFetcher::FDCallback(GIOChannel *source,
324 GIOCondition condition) {
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700325 CurlPerformOnce();
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700326 // We handle removing of this source elsewhere, so we always return true.
327 // The docs say, "the function should return FALSE if the event source
328 // should be removed."
329 // http://www.gtk.org/api/2.6/glib/glib-IO-Channels.html#GIOFunc
330 return true;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000331}
332
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700333gboolean LibcurlHttpFetcher::RetryTimeoutCallback() {
334 ResumeTransfer(url_);
335 CurlPerformOnce();
336 return FALSE; // Don't have glib auto call this callback again
337}
338
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700339gboolean LibcurlHttpFetcher::TimeoutCallback() {
Andrew de los Reyescb319332010-07-19 10:55:01 -0700340 // We always return true, even if we don't want glib to call us back.
341 // We will remove the event source separately if we don't want to
342 // be called back.
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700343 if (!transfer_in_progress_)
344 return TRUE;
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700345 CurlPerformOnce();
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700346 return TRUE;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000347}
348
349void LibcurlHttpFetcher::CleanUp() {
350 if (timeout_source_) {
351 g_source_destroy(timeout_source_);
352 timeout_source_ = NULL;
353 }
354
Darin Petkov60e14152010-10-27 16:57:04 -0700355 for (size_t t = 0; t < arraysize(io_channels_); ++t) {
356 for (IOChannels::iterator it = io_channels_[t].begin();
357 it != io_channels_[t].end(); ++it) {
358 g_source_remove(it->second.second);
359 g_io_channel_unref(it->second.first);
360 }
361 io_channels_[t].clear();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000362 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000363
364 if (curl_handle_) {
365 if (curl_multi_handle_) {
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000366 CHECK_EQ(curl_multi_remove_handle(curl_multi_handle_, curl_handle_),
367 CURLM_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000368 }
369 curl_easy_cleanup(curl_handle_);
370 curl_handle_ = NULL;
371 }
372 if (curl_multi_handle_) {
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000373 CHECK_EQ(curl_multi_cleanup(curl_multi_handle_), CURLM_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000374 curl_multi_handle_ = NULL;
375 }
376 transfer_in_progress_ = false;
377}
378
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700379void LibcurlHttpFetcher::GetHttpResponseCode() {
380 long http_response_code = 0;
381 if (curl_easy_getinfo(curl_handle_,
382 CURLINFO_RESPONSE_CODE,
383 &http_response_code) == CURLE_OK) {
384 http_response_code_ = static_cast<int>(http_response_code);
385 }
386}
387
rspangler@google.com49fdf182009-10-10 00:57:34 +0000388} // namespace chromeos_update_engine