//
// Copyright (C) 2009 The Android Open Source Project
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
rspangler@google.com49fdf182009-10-10 00:57:34 +000016
Alex Deymo14c0da82016-07-20 16:45:45 -070017#ifndef UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_
18#define UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_
rspangler@google.com49fdf182009-10-10 00:57:34 +000019
20#include <map>
Alex Deymoc1c17b42015-11-23 03:53:15 -030021#include <memory>
rspangler@google.com49fdf182009-10-10 00:57:34 +000022#include <string>
Alex Vakulenkod2779df2014-06-16 13:19:00 -070023#include <utility>
Bruno Rocha7f9aea22011-09-12 14:31:24 -070024
rspangler@google.com49fdf182009-10-10 00:57:34 +000025#include <curl/curl.h>
Bruno Rocha7f9aea22011-09-12 14:31:24 -070026
Ben Chan05735a12014-09-03 07:48:22 -070027#include <base/logging.h>
28#include <base/macros.h>
Alex Vakulenko3f39d5c2015-10-13 09:27:13 -070029#include <brillo/message_loops/message_loop.h>
Ben Chan05735a12014-09-03 07:48:22 -070030
Alex Deymo14c0da82016-07-20 16:45:45 -070031#include "update_engine/certificate_checker.h"
Alex Deymo39910dc2015-11-09 17:04:30 -080032#include "update_engine/common/hardware_interface.h"
33#include "update_engine/common/http_fetcher.h"
Jay Srinivasan43488792012-06-19 00:25:31 -070034
// LibcurlHttpFetcher is a concrete implementation of HttpFetcher that uses
// libcurl to do the HTTP work.
37
38namespace chromeos_update_engine {
39
// |UnresolvedHostStateMachine| is a representation of the internal state
// machine of |LibcurlHttpFetcher|. It starts in |State::kInit| and is advanced
// by calls to |UpdateState()|.
class UnresolvedHostStateMachine {
 public:
  enum class State {
    kInit = 0,
    kRetry = 1,
    kRetriedSuccess = 2,
    kNotRetry = 3,
  };

  UnresolvedHostStateMachine() = default;

  // Not copyable or assignable.
  UnresolvedHostStateMachine(const UnresolvedHostStateMachine&) = delete;
  UnresolvedHostStateMachine& operator=(const UnresolvedHostStateMachine&) =
      delete;

  // Returns the current state. Const so that it can be queried through a
  // const reference or pointer.
  State getState() const { return state_; }

  // Updates the following internal state machine, where
  // |failed_to_resolve_host| says whether the latest attempt ended with the
  // host unresolved:
  //
  //          |kInit|
  //             |
  //             |
  //             \/
  //     (Try, host Unresolved)
  //             |
  //             |
  //             \/
  //          |kRetry| --> (Retry, host resolved)
  //             |                  |
  //             |                  |
  //             \/                 \/
  //  (Retry, host Unresolved) |kRetriedSuccess|
  //             |
  //             |
  //             \/
  //        |kNotRetry|
  //
  void UpdateState(bool failed_to_resolve_host);

 private:
  State state_{State::kInit};
};
81
rspangler@google.com49fdf182009-10-10 00:57:34 +000082class LibcurlHttpFetcher : public HttpFetcher {
83 public:
Jay Srinivasan43488792012-06-19 00:25:31 -070084 LibcurlHttpFetcher(ProxyResolver* proxy_resolver,
Alex Deymo33e91e72015-12-01 18:26:08 -030085 HardwareInterface* hardware);
rspangler@google.com49fdf182009-10-10 00:57:34 +000086
87 // Cleans up all internal state. Does not notify delegate
Alex Deymo610277e2014-11-11 21:18:11 -080088 ~LibcurlHttpFetcher() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +000089
Alex Deymo610277e2014-11-11 21:18:11 -080090 void SetOffset(off_t offset) override { bytes_downloaded_ = offset; }
Gilad Arnolde4ad2502011-12-29 17:08:54 -080091
Alex Deymo610277e2014-11-11 21:18:11 -080092 void SetLength(size_t length) override { download_length_ = length; }
93 void UnsetLength() override { SetLength(0); }
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -070094
rspangler@google.com49fdf182009-10-10 00:57:34 +000095 // Begins the transfer if it hasn't already begun.
Alex Deymo610277e2014-11-11 21:18:11 -080096 void BeginTransfer(const std::string& url) override;
rspangler@google.com49fdf182009-10-10 00:57:34 +000097
Darin Petkov9ce452b2010-11-17 14:33:28 -080098 // If the transfer is in progress, aborts the transfer early. The transfer
99 // cannot be resumed.
Alex Deymo610277e2014-11-11 21:18:11 -0800100 void TerminateTransfer() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000101
Alex Deymofdd6dec2016-03-03 22:35:43 -0800102 // Pass the headers to libcurl.
103 void SetHeader(const std::string& header_name,
104 const std::string& header_value) override;
105
Jae Hoon Kim0ae8fe12019-06-26 14:32:50 -0700106 bool GetHeader(const std::string& header_name,
107 std::string* header_value) const override;
108
rspangler@google.com49fdf182009-10-10 00:57:34 +0000109 // Suspend the transfer by calling curl_easy_pause(CURLPAUSE_ALL).
Alex Deymo610277e2014-11-11 21:18:11 -0800110 void Pause() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000111
112 // Resume the transfer by calling curl_easy_pause(CURLPAUSE_CONT).
Alex Deymo610277e2014-11-11 21:18:11 -0800113 void Unpause() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000114
115 // Libcurl sometimes asks to be called back after some time while
116 // leaving that time unspecified. In that case, we pick a reasonable
117 // default of one second, but it can be overridden here. This is
118 // primarily useful for testing.
119 // From http://curl.haxx.se/libcurl/c/curl_multi_timeout.html:
120 // if libcurl returns a -1 timeout here, it just means that libcurl
121 // currently has no stored timeout value. You must not wait too long
122 // (more than a few seconds perhaps) before you call
123 // curl_multi_perform() again.
Alex Deymo610277e2014-11-11 21:18:11 -0800124 void set_idle_seconds(int seconds) override { idle_seconds_ = seconds; }
Darin Petkovb83371f2010-08-17 09:34:49 -0700125
126 // Sets the retry timeout. Useful for testing.
Alex Deymo610277e2014-11-11 21:18:11 -0800127 void set_retry_seconds(int seconds) override { retry_seconds_ = seconds; }
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700128
Darin Petkova0929552010-11-29 14:19:06 -0800129 void set_no_network_max_retries(int retries) {
130 no_network_max_retries_ = retries;
131 }
132
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700133 int get_no_network_max_retries() { return no_network_max_retries_; }
134
Alex Deymo33e91e72015-12-01 18:26:08 -0300135 void set_server_to_check(ServerToCheck server_to_check) {
136 server_to_check_ = server_to_check;
137 }
138
Alex Deymo610277e2014-11-11 21:18:11 -0800139 size_t GetBytesDownloaded() override {
Gilad Arnold48085ba2011-11-16 09:36:08 -0800140 return static_cast<size_t>(bytes_downloaded_);
141 }
142
Alex Deymo610277e2014-11-11 21:18:11 -0800143 void set_low_speed_limit(int low_speed_bps, int low_speed_sec) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700144 low_speed_limit_bps_ = low_speed_bps;
145 low_speed_time_seconds_ = low_speed_sec;
146 }
147
Alex Deymo610277e2014-11-11 21:18:11 -0800148 void set_connect_timeout(int connect_timeout_seconds) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700149 connect_timeout_seconds_ = connect_timeout_seconds;
150 }
151
Alex Deymo610277e2014-11-11 21:18:11 -0800152 void set_max_retry_count(int max_retry_count) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700153 max_retry_count_ = max_retry_count;
154 }
155
Xiaochu Liu4a1173a2019-04-10 10:49:08 -0700156 void set_is_update_check(bool is_update_check) {
157 is_update_check_ = is_update_check;
158 }
159
rspangler@google.com49fdf182009-10-10 00:57:34 +0000160 private:
Alex Deymo13e95182017-03-16 19:06:13 -0700161 // libcurl's CURLOPT_CLOSESOCKETFUNCTION callback function. Called when
162 // closing a socket created with the CURLOPT_OPENSOCKETFUNCTION callback.
163 static int LibcurlCloseSocketCallback(void* clientp, curl_socket_t item);
164
Andrew de los Reyesf3ed8e72011-02-16 10:35:46 -0800165 // Callback for when proxy resolution has completed. This begins the
166 // transfer.
167 void ProxiesResolved();
Jay Srinivasan43488792012-06-19 00:25:31 -0700168
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700169 // Asks libcurl for the http response code and stores it in the object.
170 void GetHttpResponseCode();
171
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700172 // Returns the last |CURLcode|.
173 CURLcode GetCurlCode();
Xiaochu Liu4a1173a2019-04-10 10:49:08 -0700174
Gilad Arnold9bedeb52011-11-17 16:19:57 -0800175 // Checks whether stored HTTP response is within the success range.
Gilad Arnold48085ba2011-11-16 09:36:08 -0800176 inline bool IsHttpResponseSuccess() {
177 return (http_response_code_ >= 200 && http_response_code_ < 300);
178 }
179
Gilad Arnold9bedeb52011-11-17 16:19:57 -0800180 // Checks whether stored HTTP response is within the error range. This
181 // includes both errors with the request (4xx) and server errors (5xx).
182 inline bool IsHttpResponseError() {
183 return (http_response_code_ >= 400 && http_response_code_ < 600);
184 }
185
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000186 // Resumes a transfer where it left off. This will use the
187 // HTTP Range: header to make a new connection from where the last
188 // left off.
189 virtual void ResumeTransfer(const std::string& url);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000190
Alex Deymo60ca1a72015-06-18 18:19:15 -0700191 void TimeoutCallback();
192 void RetryTimeoutCallback();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000193
194 // Calls into curl_multi_perform to let libcurl do its work. Returns after
195 // curl_multi_perform is finished, which may actually be after more than
Alex Deymo0b3db6b2015-08-10 15:19:37 -0700196 // one call to curl_multi_perform. This method will set up the message
Alex Deymof2858572016-02-25 11:20:13 -0800197 // loop with sources for future work that libcurl will do, if any, or complete
198 // the transfer and finish the action if no work left to do.
rspangler@google.com49fdf182009-10-10 00:57:34 +0000199 // This method will not block.
Andrew de los Reyescb319332010-07-19 10:55:01 -0700200 void CurlPerformOnce();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000201
Alex Deymo29b81532015-07-09 11:51:49 -0700202 // Sets up message loop sources as needed by libcurl. This is generally
rspangler@google.com49fdf182009-10-10 00:57:34 +0000203 // the file descriptor of the socket and a timer in case nothing happens
204 // on the fds.
Alex Deymo29b81532015-07-09 11:51:49 -0700205 void SetupMessageLoopSources();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000206
207 // Callback called by libcurl when new data has arrived on the transfer
Amin Hassani7cc8bb02019-01-14 16:29:47 -0800208 size_t LibcurlWrite(void* ptr, size_t size, size_t nmemb);
209 static size_t StaticLibcurlWrite(void* ptr,
210 size_t size,
211 size_t nmemb,
212 void* stream) {
213 return reinterpret_cast<LibcurlHttpFetcher*>(stream)->LibcurlWrite(
214 ptr, size, nmemb);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000215 }
216
217 // Cleans up the following if they are non-null:
Alex Deymo29b81532015-07-09 11:51:49 -0700218 // curl(m) handles, fd_task_maps_, timeout_id_.
rspangler@google.com49fdf182009-10-10 00:57:34 +0000219 void CleanUp();
220
Darin Petkov9ce452b2010-11-17 14:33:28 -0800221 // Force terminate the transfer. This will invoke the delegate's (if any)
222 // TransferTerminated callback so, after returning, this fetcher instance may
223 // be destroyed.
224 void ForceTransferTermination();
225
Jay Srinivasanb3f55402012-12-03 18:12:04 -0800226 // Sets the curl options for HTTP URL.
227 void SetCurlOptionsForHttp();
228
229 // Sets the curl options for HTTPS URL.
230 void SetCurlOptionsForHttps();
231
Alex Deymo56ccb072016-02-05 00:50:48 -0800232 // Sets the curl options for file URI.
233 void SetCurlOptionsForFile();
234
Gilad Arnold59d9e012013-07-23 16:41:43 -0700235 // Convert a proxy URL into a curl proxy type, if applicable. Returns true iff
236 // conversion was successful, false otherwise (in which case nothing is
237 // written to |out_type|).
238 bool GetProxyType(const std::string& proxy, curl_proxytype* out_type);
239
Alex Deymoc1c17b42015-11-23 03:53:15 -0300240 // Hardware interface used to query dev-mode and official build settings.
241 HardwareInterface* hardware_;
242
rspangler@google.com49fdf182009-10-10 00:57:34 +0000243 // Handles for the libcurl library
Alex Deymo60ca1a72015-06-18 18:19:15 -0700244 CURLM* curl_multi_handle_{nullptr};
245 CURL* curl_handle_{nullptr};
246 struct curl_slist* curl_http_headers_{nullptr};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000247
Alex Deymofdd6dec2016-03-03 22:35:43 -0800248 // The extra headers that will be sent on each request.
249 std::map<std::string, std::string> extra_headers_;
250
Darin Petkov60e14152010-10-27 16:57:04 -0700251 // Lists of all read(0)/write(1) file descriptors that we're waiting on from
Alex Deymo29b81532015-07-09 11:51:49 -0700252 // the message loop. libcurl may open/close descriptors and switch their
Darin Petkov60e14152010-10-27 16:57:04 -0700253 // directions so maintain two separate lists so that watch conditions can be
254 // set appropriately.
Alex Vakulenko3f39d5c2015-10-13 09:27:13 -0700255 std::map<int, brillo::MessageLoop::TaskId> fd_task_maps_[2];
rspangler@google.com49fdf182009-10-10 00:57:34 +0000256
Alex Deymo60ca1a72015-06-18 18:19:15 -0700257 // The TaskId of the timer we're waiting on. kTaskIdNull if we are not waiting
258 // on it.
Alex Vakulenko3f39d5c2015-10-13 09:27:13 -0700259 brillo::MessageLoop::TaskId timeout_id_{brillo::MessageLoop::kTaskIdNull};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000260
Alex Deymo29b81532015-07-09 11:51:49 -0700261 bool transfer_in_progress_{false};
Alex Deymof2858572016-02-25 11:20:13 -0800262 bool transfer_paused_{false};
263
264 // Whether it should ignore transfer failures for the purpose of retrying the
265 // connection.
266 bool ignore_failure_{false};
267
268 // Whether we should restart the transfer once Unpause() is called. This can
269 // be caused because either the connection dropped while pause or the proxy
270 // was resolved and we never started the transfer in the first place.
271 bool restart_transfer_on_unpause_{false};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000272
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000273 // The transfer size. -1 if not known.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700274 off_t transfer_size_{0};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000275
276 // How many bytes have been downloaded and sent to the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700277 off_t bytes_downloaded_{0};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000278
Gilad Arnolde4ad2502011-12-29 17:08:54 -0800279 // The remaining maximum number of bytes to download. Zero represents an
280 // unspecified length.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700281 size_t download_length_{0};
Gilad Arnolde4ad2502011-12-29 17:08:54 -0800282
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000283 // If we resumed an earlier transfer, data offset that we used for the
284 // new connection. 0 otherwise.
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700285 // In this class, resume refers to resuming a dropped HTTP connection,
286 // not to resuming an interrupted download.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700287 off_t resume_offset_{0};
Darin Petkovb83371f2010-08-17 09:34:49 -0700288
Jay Srinivasan32f23572012-06-05 13:45:07 -0700289 // Number of resumes performed so far and the max allowed.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700290 int retry_count_{0};
291 int max_retry_count_{kDownloadMaxRetryCount};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000292
Darin Petkovb83371f2010-08-17 09:34:49 -0700293 // Seconds to wait before retrying a resume.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700294 int retry_seconds_{20};
Darin Petkovb83371f2010-08-17 09:34:49 -0700295
Alex Deymob20de692017-02-05 07:47:37 +0000296 // When waiting for a retry, the task id of the retry callback.
297 brillo::MessageLoop::TaskId retry_task_id_{brillo::MessageLoop::kTaskIdNull};
298
Darin Petkova0929552010-11-29 14:19:06 -0800299 // Number of resumes due to no network (e.g., HTTP response code 0).
Alex Deymo60ca1a72015-06-18 18:19:15 -0700300 int no_network_retry_count_{0};
301 int no_network_max_retries_{0};
Darin Petkova0929552010-11-29 14:19:06 -0800302
Darin Petkovb83371f2010-08-17 09:34:49 -0700303 // Seconds to wait before asking libcurl to "perform".
Alex Deymo60ca1a72015-06-18 18:19:15 -0700304 int idle_seconds_{1};
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700305
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700306 // If true, we are currently performing a write callback on the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700307 bool in_write_callback_{false};
Darin Petkova0929552010-11-29 14:19:06 -0800308
Andrew de los Reyes45168102010-11-22 11:13:50 -0800309 // If true, we have returned at least one byte in the write callback
310 // to the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700311 bool sent_byte_{false};
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700312
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700313 // We can't clean everything up while we're in a write callback, so
314 // if we get a terminate request, queue it until we can handle it.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700315 bool terminate_requested_{false};
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700316
Alex Deymo33e91e72015-12-01 18:26:08 -0300317 // The ServerToCheck used when checking this connection's certificate. If no
318 // certificate check needs to be performed, this should be set to
319 // ServerToCheck::kNone.
320 ServerToCheck server_to_check_{ServerToCheck::kNone};
Bruno Rocha7f9aea22011-09-12 14:31:24 -0700321
Xiaochu Liu4a1173a2019-04-10 10:49:08 -0700322 // True if this object is for update check.
323 bool is_update_check_{false};
324
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700325 // Internal state machine.
326 UnresolvedHostStateMachine unresolved_host_state_machine_;
327
Alex Deymo60ca1a72015-06-18 18:19:15 -0700328 int low_speed_limit_bps_{kDownloadLowSpeedLimitBps};
329 int low_speed_time_seconds_{kDownloadLowSpeedTimeSeconds};
330 int connect_timeout_seconds_{kDownloadConnectTimeoutSeconds};
David Zeuthen34135a92013-08-06 11:16:16 -0700331
rspangler@google.com49fdf182009-10-10 00:57:34 +0000332 DISALLOW_COPY_AND_ASSIGN(LibcurlHttpFetcher);
333};
334
335} // namespace chromeos_update_engine
336
Alex Deymo14c0da82016-07-20 16:45:45 -0700337#endif // UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_