blob: d5358bd252118b90efa4fd8219192c51d2cf77ca [file] [log] [blame]
// Copyright (c) 2009 The Chromium OS Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4
rspangler@google.com49fdf182009-10-10 00:57:34 +00005#include "update_engine/libcurl_http_fetcher.h"
Andrew de los Reyesd57d1472010-10-21 13:34:08 -07006
adlr@google.comc98a7ed2009-12-04 18:54:03 +00007#include <algorithm>
Andrew de los Reyesd57d1472010-10-21 13:34:08 -07008#include <string>
9
10#include <base/logging.h>
11
12#include "update_engine/dbus_interface.h"
13#include "update_engine/flimflam_proxy.h"
14#include "update_engine/utils.h"
adlr@google.comc98a7ed2009-12-04 18:54:03 +000015
16using std::max;
17using std::make_pair;
Andrew de los Reyesd57d1472010-10-21 13:34:08 -070018using std::string;
rspangler@google.com49fdf182009-10-10 00:57:34 +000019
// This is a concrete implementation of HttpFetcher that uses libcurl to do the
// HTTP work.
22
23namespace chromeos_update_engine {
24
namespace {

// Number of times an incomplete transfer may be restarted; once the retry
// counter exceeds this value the transfer is reported as failed.
const int kMaxRetriesCount = 20;

// Directory handed to libcurl as CURLOPT_CAPATH when running an official
// build.
const char kCACertificatesPath[] = "/usr/share/update_engine/ca-certificates";

}  // namespace
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -070029
rspangler@google.com49fdf182009-10-10 00:57:34 +000030LibcurlHttpFetcher::~LibcurlHttpFetcher() {
31 CleanUp();
32}
33
Andrew de los Reyesd57d1472010-10-21 13:34:08 -070034// On error, returns false.
35bool LibcurlHttpFetcher::ConnectionIsExpensive() const {
36 if (force_connection_type_)
37 return forced_expensive_connection_;
38 NetworkConnectionType type;
39 ConcreteDbusGlib dbus_iface;
40 TEST_AND_RETURN_FALSE(FlimFlamProxy::GetConnectionType(&dbus_iface, &type));
41 LOG(INFO) << "We are connected via "
42 << FlimFlamProxy::StringForConnectionType(type);
43 return FlimFlamProxy::IsExpensiveConnectionType(type);
44}
45
Darin Petkovfc7a0ce2010-10-25 10:38:37 -070046bool LibcurlHttpFetcher::IsOfficialBuild() const {
47 return force_build_type_ ? forced_official_build_ : utils::IsOfficialBuild();
48}
49
adlr@google.comc98a7ed2009-12-04 18:54:03 +000050void LibcurlHttpFetcher::ResumeTransfer(const std::string& url) {
Andrew de los Reyes3270f742010-07-15 22:28:14 -070051 LOG(INFO) << "Starting/Resuming transfer";
rspangler@google.com49fdf182009-10-10 00:57:34 +000052 CHECK(!transfer_in_progress_);
53 url_ = url;
54 curl_multi_handle_ = curl_multi_init();
55 CHECK(curl_multi_handle_);
56
57 curl_handle_ = curl_easy_init();
58 CHECK(curl_handle_);
59
60 if (post_data_set_) {
adlr@google.comc98a7ed2009-12-04 18:54:03 +000061 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_POST, 1), CURLE_OK);
62 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_POSTFIELDS,
63 &post_data_[0]),
64 CURLE_OK);
65 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_POSTFIELDSIZE,
66 post_data_.size()),
67 CURLE_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +000068 }
69
adlr@google.comc98a7ed2009-12-04 18:54:03 +000070 if (bytes_downloaded_ > 0) {
71 // Resume from where we left off
72 resume_offset_ = bytes_downloaded_;
73 CHECK_EQ(curl_easy_setopt(curl_handle_,
74 CURLOPT_RESUME_FROM_LARGE,
75 bytes_downloaded_), CURLE_OK);
76 }
77
78 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_WRITEDATA, this), CURLE_OK);
79 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_WRITEFUNCTION,
80 StaticLibcurlWrite), CURLE_OK);
Andrew de los Reyesd57d1472010-10-21 13:34:08 -070081
82 string url_to_use(url_);
83 if (ConnectionIsExpensive()) {
84 LOG(INFO) << "Not initiating HTTP connection b/c we are on an expensive"
85 << " connection";
86 url_to_use = ""; // Sabotage the URL
87 }
88
Darin Petkovfc7a0ce2010-10-25 10:38:37 -070089 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_URL, url_to_use.c_str()),
Andrew de los Reyesd57d1472010-10-21 13:34:08 -070090 CURLE_OK);
Andrew de los Reyes3270f742010-07-15 22:28:14 -070091
Darin Petkov192ced42010-07-23 16:20:24 -070092 // If the connection drops under 10 bytes/sec for 3 minutes, reconnect.
Andrew de los Reyes3270f742010-07-15 22:28:14 -070093 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_LOW_SPEED_LIMIT, 10),
94 CURLE_OK);
Darin Petkov192ced42010-07-23 16:20:24 -070095 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_LOW_SPEED_TIME, 3 * 60),
Andrew de los Reyes3270f742010-07-15 22:28:14 -070096 CURLE_OK);
97
Darin Petkov41c2fcf2010-08-25 13:14:48 -070098 // By default, libcurl doesn't follow redirections. Allow up to
99 // |kMaxRedirects| redirections.
Darin Petkov3a4016a2010-09-28 13:54:17 -0700100 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_FOLLOWLOCATION, 1), CURLE_OK);
Darin Petkov41c2fcf2010-08-25 13:14:48 -0700101 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_MAXREDIRS, kMaxRedirects),
102 CURLE_OK);
103
Darin Petkove237d192010-11-16 10:26:08 -0800104 // Security lock-down in official builds: makes sure that peer certificate
105 // verification is enabled, restricts the set of trusted certificates,
106 // restricts protocols to HTTPS, restricts ciphers to HIGH.
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700107 if (IsOfficialBuild()) {
Darin Petkove237d192010-11-16 10:26:08 -0800108 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_SSL_VERIFYPEER, 1),
109 CURLE_OK);
110 CHECK_EQ(curl_easy_setopt(curl_handle_,
111 CURLOPT_CAPATH,
112 kCACertificatesPath),
113 CURLE_OK);
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700114 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_PROTOCOLS, CURLPROTO_HTTPS),
115 CURLE_OK);
116 CHECK_EQ(curl_easy_setopt(curl_handle_,
117 CURLOPT_REDIR_PROTOCOLS,
118 CURLPROTO_HTTPS),
119 CURLE_OK);
Darin Petkove237d192010-11-16 10:26:08 -0800120 CHECK_EQ(curl_easy_setopt(curl_handle_, CURLOPT_SSL_CIPHER_LIST, "HIGH"),
121 CURLE_OK);
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700122 }
123
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000124 CHECK_EQ(curl_multi_add_handle(curl_multi_handle_, curl_handle_), CURLM_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000125 transfer_in_progress_ = true;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000126}
127
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000128// Begins the transfer, which must not have already been started.
129void LibcurlHttpFetcher::BeginTransfer(const std::string& url) {
130 transfer_size_ = -1;
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000131 resume_offset_ = 0;
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700132 retry_count_ = 0;
Darin Petkovcb466212010-08-26 09:40:11 -0700133 http_response_code_ = 0;
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700134 ResumeTransfer(url);
135 CurlPerformOnce();
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000136}
137
rspangler@google.com49fdf182009-10-10 00:57:34 +0000138void LibcurlHttpFetcher::TerminateTransfer() {
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700139 if (in_write_callback_)
140 terminate_requested_ = true;
141 else
142 CleanUp();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000143}
144
Andrew de los Reyescb319332010-07-19 10:55:01 -0700145void LibcurlHttpFetcher::CurlPerformOnce() {
rspangler@google.com49fdf182009-10-10 00:57:34 +0000146 CHECK(transfer_in_progress_);
147 int running_handles = 0;
148 CURLMcode retcode = CURLM_CALL_MULTI_PERFORM;
149
150 // libcurl may request that we immediately call curl_multi_perform after it
151 // returns, so we do. libcurl promises that curl_multi_perform will not block.
152 while (CURLM_CALL_MULTI_PERFORM == retcode) {
153 retcode = curl_multi_perform(curl_multi_handle_, &running_handles);
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700154 if (terminate_requested_) {
155 CleanUp();
156 return;
157 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000158 }
159 if (0 == running_handles) {
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700160 GetHttpResponseCode();
161 if (http_response_code_) {
162 LOG(INFO) << "HTTP response code: " << http_response_code_;
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700163 } else {
164 LOG(ERROR) << "Unable to get http response code.";
165 }
Darin Petkov192ced42010-07-23 16:20:24 -0700166
rspangler@google.com49fdf182009-10-10 00:57:34 +0000167 // we're done!
168 CleanUp();
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000169
170 if ((transfer_size_ >= 0) && (bytes_downloaded_ < transfer_size_)) {
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700171 // Need to restart transfer
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700172 retry_count_++;
173 LOG(INFO) << "Restarting transfer b/c we finished, had downloaded "
174 << bytes_downloaded_ << " bytes, but transfer_size_ is "
175 << transfer_size_ << ". retry_count: " << retry_count_;
176 if (retry_count_ > kMaxRetriesCount) {
177 if (delegate_)
178 delegate_->TransferComplete(this, false); // success
179 } else {
Darin Petkovb83371f2010-08-17 09:34:49 -0700180 g_timeout_add_seconds(retry_seconds_,
Darin Petkov9b111652010-08-16 11:46:25 -0700181 &LibcurlHttpFetcher::StaticRetryTimeoutCallback,
182 this);
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700183 }
Andrew de los Reyescb319332010-07-19 10:55:01 -0700184 return;
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000185 } else {
186 if (delegate_) {
Andrew de los Reyesfb4ad7d2010-07-19 10:43:46 -0700187 // success is when http_response_code is 2xx
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700188 bool success = (http_response_code_ >= 200) &&
189 (http_response_code_ < 300);
Andrew de los Reyesfb4ad7d2010-07-19 10:43:46 -0700190 delegate_->TransferComplete(this, success);
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000191 }
192 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000193 } else {
194 // set up callback
195 SetupMainloopSources();
196 }
197}
198
199size_t LibcurlHttpFetcher::LibcurlWrite(void *ptr, size_t size, size_t nmemb) {
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700200 GetHttpResponseCode();
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000201 {
202 double transfer_size_double;
203 CHECK_EQ(curl_easy_getinfo(curl_handle_,
204 CURLINFO_CONTENT_LENGTH_DOWNLOAD,
205 &transfer_size_double), CURLE_OK);
206 off_t new_transfer_size = static_cast<off_t>(transfer_size_double);
207 if (new_transfer_size > 0) {
208 transfer_size_ = resume_offset_ + new_transfer_size;
209 }
210 }
211 bytes_downloaded_ += size * nmemb;
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700212 in_write_callback_ = true;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000213 if (delegate_)
214 delegate_->ReceivedBytes(this, reinterpret_cast<char*>(ptr), size * nmemb);
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700215 in_write_callback_ = false;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000216 return size * nmemb;
217}
218
219void LibcurlHttpFetcher::Pause() {
220 CHECK(curl_handle_);
221 CHECK(transfer_in_progress_);
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000222 CHECK_EQ(curl_easy_pause(curl_handle_, CURLPAUSE_ALL), CURLE_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000223}
224
225void LibcurlHttpFetcher::Unpause() {
226 CHECK(curl_handle_);
227 CHECK(transfer_in_progress_);
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000228 CHECK_EQ(curl_easy_pause(curl_handle_, CURLPAUSE_CONT), CURLE_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000229}
230
231// This method sets up callbacks with the glib main loop.
232void LibcurlHttpFetcher::SetupMainloopSources() {
233 fd_set fd_read;
234 fd_set fd_write;
Darin Petkov60e14152010-10-27 16:57:04 -0700235 fd_set fd_exc;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000236
237 FD_ZERO(&fd_read);
238 FD_ZERO(&fd_write);
Darin Petkov60e14152010-10-27 16:57:04 -0700239 FD_ZERO(&fd_exc);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000240
241 int fd_max = 0;
242
243 // Ask libcurl for the set of file descriptors we should track on its
244 // behalf.
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000245 CHECK_EQ(curl_multi_fdset(curl_multi_handle_, &fd_read, &fd_write,
Darin Petkov60e14152010-10-27 16:57:04 -0700246 &fd_exc, &fd_max), CURLM_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000247
248 // We should iterate through all file descriptors up to libcurl's fd_max or
Darin Petkov60e14152010-10-27 16:57:04 -0700249 // the highest one we're tracking, whichever is larger.
250 for (size_t t = 0; t < arraysize(io_channels_); ++t) {
251 if (!io_channels_[t].empty())
252 fd_max = max(fd_max, io_channels_[t].rbegin()->first);
253 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000254
Darin Petkov60e14152010-10-27 16:57:04 -0700255 // For each fd, if we're not tracking it, track it. If we are tracking it, but
256 // libcurl doesn't care about it anymore, stop tracking it. After this loop,
257 // there should be exactly as many GIOChannel objects in io_channels_[0|1] as
258 // there are read/write fds that we're tracking.
259 for (int fd = 0; fd <= fd_max; ++fd) {
260 // Note that fd_exc is unused in the current version of libcurl so is_exc
261 // should always be false.
262 bool is_exc = FD_ISSET(fd, &fd_exc) != 0;
263 bool must_track[2] = {
264 is_exc || (FD_ISSET(fd, &fd_read) != 0), // track 0 -- read
265 is_exc || (FD_ISSET(fd, &fd_write) != 0) // track 1 -- write
266 };
267
268 for (size_t t = 0; t < arraysize(io_channels_); ++t) {
269 bool tracked = io_channels_[t].find(fd) != io_channels_[t].end();
270
271 if (!must_track[t]) {
272 // If we have an outstanding io_channel, remove it.
273 if (tracked) {
274 g_source_remove(io_channels_[t][fd].second);
275 g_io_channel_unref(io_channels_[t][fd].first);
276 io_channels_[t].erase(io_channels_[t].find(fd));
277 }
278 continue;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000279 }
Darin Petkov60e14152010-10-27 16:57:04 -0700280
281 // If we are already tracking this fd, continue -- nothing to do.
282 if (tracked)
283 continue;
284
285 // Set conditions appropriately -- read for track 0, write for track 1.
286 GIOCondition condition = static_cast<GIOCondition>(
287 ((t == 0) ? (G_IO_IN | G_IO_PRI) : G_IO_OUT) | G_IO_ERR | G_IO_HUP);
288
289 // Track a new fd.
290 GIOChannel* io_channel = g_io_channel_unix_new(fd);
291 guint tag =
292 g_io_add_watch(io_channel, condition, &StaticFDCallback, this);
293
294 io_channels_[t][fd] = make_pair(io_channel, tag);
295 static int io_counter = 0;
296 io_counter++;
297 if (io_counter % 50 == 0) {
298 LOG(INFO) << "io_counter = " << io_counter;
299 }
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700300 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000301 }
302
Darin Petkovb83371f2010-08-17 09:34:49 -0700303 // Set up a timeout callback for libcurl.
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700304 if (!timeout_source_) {
Darin Petkovb83371f2010-08-17 09:34:49 -0700305 LOG(INFO) << "Setting up timeout source: " << idle_seconds_ << " seconds.";
306 timeout_source_ = g_timeout_source_new_seconds(idle_seconds_);
307 g_source_set_callback(timeout_source_, StaticTimeoutCallback, this, NULL);
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700308 g_source_attach(timeout_source_, NULL);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000309 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000310}
311
312bool LibcurlHttpFetcher::FDCallback(GIOChannel *source,
313 GIOCondition condition) {
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700314 CurlPerformOnce();
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700315 // We handle removing of this source elsewhere, so we always return true.
316 // The docs say, "the function should return FALSE if the event source
317 // should be removed."
318 // http://www.gtk.org/api/2.6/glib/glib-IO-Channels.html#GIOFunc
319 return true;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000320}
321
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700322gboolean LibcurlHttpFetcher::RetryTimeoutCallback() {
323 ResumeTransfer(url_);
324 CurlPerformOnce();
325 return FALSE; // Don't have glib auto call this callback again
326}
327
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700328gboolean LibcurlHttpFetcher::TimeoutCallback() {
Andrew de los Reyescb319332010-07-19 10:55:01 -0700329 // We always return true, even if we don't want glib to call us back.
330 // We will remove the event source separately if we don't want to
331 // be called back.
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700332 if (!transfer_in_progress_)
333 return TRUE;
Andrew de los Reyes9bbd1872010-07-16 14:52:29 -0700334 CurlPerformOnce();
Andrew de los Reyes3270f742010-07-15 22:28:14 -0700335 return TRUE;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000336}
337
338void LibcurlHttpFetcher::CleanUp() {
339 if (timeout_source_) {
340 g_source_destroy(timeout_source_);
341 timeout_source_ = NULL;
342 }
343
Darin Petkov60e14152010-10-27 16:57:04 -0700344 for (size_t t = 0; t < arraysize(io_channels_); ++t) {
345 for (IOChannels::iterator it = io_channels_[t].begin();
346 it != io_channels_[t].end(); ++it) {
347 g_source_remove(it->second.second);
348 g_io_channel_unref(it->second.first);
349 }
350 io_channels_[t].clear();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000351 }
rspangler@google.com49fdf182009-10-10 00:57:34 +0000352
353 if (curl_handle_) {
354 if (curl_multi_handle_) {
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000355 CHECK_EQ(curl_multi_remove_handle(curl_multi_handle_, curl_handle_),
356 CURLM_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000357 }
358 curl_easy_cleanup(curl_handle_);
359 curl_handle_ = NULL;
360 }
361 if (curl_multi_handle_) {
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000362 CHECK_EQ(curl_multi_cleanup(curl_multi_handle_), CURLM_OK);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000363 curl_multi_handle_ = NULL;
364 }
365 transfer_in_progress_ = false;
366}
367
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700368void LibcurlHttpFetcher::GetHttpResponseCode() {
369 long http_response_code = 0;
370 if (curl_easy_getinfo(curl_handle_,
371 CURLINFO_RESPONSE_CODE,
372 &http_response_code) == CURLE_OK) {
373 http_response_code_ = static_cast<int>(http_response_code);
374 }
375}
376
rspangler@google.com49fdf182009-10-10 00:57:34 +0000377} // namespace chromeos_update_engine