blob: 4e91b6930a7452affba0d83f00a9bf15237c50ee [file] [log] [blame]
Alex Deymoaea4c1c2015-08-19 20:24:43 -07001//
2// Copyright (C) 2009 The Android Open Source Project
3//
4// Licensed under the Apache License, Version 2.0 (the "License");
5// you may not use this file except in compliance with the License.
6// You may obtain a copy of the License at
7//
8// http://www.apache.org/licenses/LICENSE-2.0
9//
10// Unless required by applicable law or agreed to in writing, software
11// distributed under the License is distributed on an "AS IS" BASIS,
12// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13// See the License for the specific language governing permissions and
14// limitations under the License.
15//
rspangler@google.com49fdf182009-10-10 00:57:34 +000016
Alex Deymo14c0da82016-07-20 16:45:45 -070017#ifndef UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_
18#define UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_
rspangler@google.com49fdf182009-10-10 00:57:34 +000019
20#include <map>
Alex Deymoc1c17b42015-11-23 03:53:15 -030021#include <memory>
rspangler@google.com49fdf182009-10-10 00:57:34 +000022#include <string>
Alex Vakulenkod2779df2014-06-16 13:19:00 -070023#include <utility>
Bruno Rocha7f9aea22011-09-12 14:31:24 -070024
rspangler@google.com49fdf182009-10-10 00:57:34 +000025#include <curl/curl.h>
Bruno Rocha7f9aea22011-09-12 14:31:24 -070026
Hidehiko Abe493fecb2019-07-10 23:30:50 +090027#include <base/files/file_descriptor_watcher_posix.h>
Ben Chan05735a12014-09-03 07:48:22 -070028#include <base/logging.h>
29#include <base/macros.h>
Alex Vakulenko3f39d5c2015-10-13 09:27:13 -070030#include <brillo/message_loops/message_loop.h>
Ben Chan05735a12014-09-03 07:48:22 -070031
Alex Deymo14c0da82016-07-20 16:45:45 -070032#include "update_engine/certificate_checker.h"
Alex Deymo39910dc2015-11-09 17:04:30 -080033#include "update_engine/common/hardware_interface.h"
34#include "update_engine/common/http_fetcher.h"
Jay Srinivasan43488792012-06-19 00:25:31 -070035
// This is a concrete implementation of HttpFetcher that uses libcurl to do the
// http work.
38
39namespace chromeos_update_engine {
40
// |UnresolvedHostStateMachine| is a representation of the internal state
// machine that |LibcurlHttpFetcher| uses to track attempts whose host name
// could not be resolved. It starts in |State::kInit| and is advanced through
// UpdateState().
class UnresolvedHostStateMachine {
 public:
  // The states of the machine; see UpdateState() for the transitions.
  enum class State {
    kInit = 0,
    kRetry = 1,
    kRetriedSuccess = 2,
    kNotRetry = 3,
  };

  UnresolvedHostStateMachine() = default;

  // Not copyable or assignable.
  UnresolvedHostStateMachine(const UnresolvedHostStateMachine&) = delete;
  UnresolvedHostStateMachine& operator=(const UnresolvedHostStateMachine&) =
      delete;

  // Returns the current state. Const so that it can be queried through a
  // const reference; it never modifies the machine.
  State GetState() const { return state_; }

  // Updates the following internal state machine, where
  // |failed_to_resolve_host| tells whether the latest attempt failed to
  // resolve the host:
  //
  //              |kInit|
  //                 |
  //                 |
  //                 \/
  //       (Try, host Unresolved)
  //                 |
  //                 |
  //                 \/
  //              |kRetry| ----------> (Retry, host resolved)
  //                 |                           |
  //                 |                           |
  //                 \/                          \/
  //      (Retry, host Unresolved)        |kRetriedSuccess|
  //                 |
  //                 |
  //                 \/
  //            |kNotRetry|
  //
  void UpdateState(bool failed_to_resolve_host);

 private:
  // Current state; a freshly constructed machine is in |kInit|.
  State state_ = {State::kInit};
};
82
rspangler@google.com49fdf182009-10-10 00:57:34 +000083class LibcurlHttpFetcher : public HttpFetcher {
84 public:
Jay Srinivasan43488792012-06-19 00:25:31 -070085 LibcurlHttpFetcher(ProxyResolver* proxy_resolver,
Alex Deymo33e91e72015-12-01 18:26:08 -030086 HardwareInterface* hardware);
rspangler@google.com49fdf182009-10-10 00:57:34 +000087
88 // Cleans up all internal state. Does not notify delegate
Alex Deymo610277e2014-11-11 21:18:11 -080089 ~LibcurlHttpFetcher() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +000090
Alex Deymo610277e2014-11-11 21:18:11 -080091 void SetOffset(off_t offset) override { bytes_downloaded_ = offset; }
Gilad Arnolde4ad2502011-12-29 17:08:54 -080092
Alex Deymo610277e2014-11-11 21:18:11 -080093 void SetLength(size_t length) override { download_length_ = length; }
94 void UnsetLength() override { SetLength(0); }
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -070095
rspangler@google.com49fdf182009-10-10 00:57:34 +000096 // Begins the transfer if it hasn't already begun.
Alex Deymo610277e2014-11-11 21:18:11 -080097 void BeginTransfer(const std::string& url) override;
rspangler@google.com49fdf182009-10-10 00:57:34 +000098
Darin Petkov9ce452b2010-11-17 14:33:28 -080099 // If the transfer is in progress, aborts the transfer early. The transfer
100 // cannot be resumed.
Alex Deymo610277e2014-11-11 21:18:11 -0800101 void TerminateTransfer() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000102
Alex Deymofdd6dec2016-03-03 22:35:43 -0800103 // Pass the headers to libcurl.
104 void SetHeader(const std::string& header_name,
105 const std::string& header_value) override;
106
Jae Hoon Kim0ae8fe12019-06-26 14:32:50 -0700107 bool GetHeader(const std::string& header_name,
108 std::string* header_value) const override;
109
rspangler@google.com49fdf182009-10-10 00:57:34 +0000110 // Suspend the transfer by calling curl_easy_pause(CURLPAUSE_ALL).
Alex Deymo610277e2014-11-11 21:18:11 -0800111 void Pause() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000112
113 // Resume the transfer by calling curl_easy_pause(CURLPAUSE_CONT).
Alex Deymo610277e2014-11-11 21:18:11 -0800114 void Unpause() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000115
116 // Libcurl sometimes asks to be called back after some time while
117 // leaving that time unspecified. In that case, we pick a reasonable
118 // default of one second, but it can be overridden here. This is
119 // primarily useful for testing.
120 // From http://curl.haxx.se/libcurl/c/curl_multi_timeout.html:
121 // if libcurl returns a -1 timeout here, it just means that libcurl
122 // currently has no stored timeout value. You must not wait too long
123 // (more than a few seconds perhaps) before you call
124 // curl_multi_perform() again.
Alex Deymo610277e2014-11-11 21:18:11 -0800125 void set_idle_seconds(int seconds) override { idle_seconds_ = seconds; }
Darin Petkovb83371f2010-08-17 09:34:49 -0700126
127 // Sets the retry timeout. Useful for testing.
Alex Deymo610277e2014-11-11 21:18:11 -0800128 void set_retry_seconds(int seconds) override { retry_seconds_ = seconds; }
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700129
Darin Petkova0929552010-11-29 14:19:06 -0800130 void set_no_network_max_retries(int retries) {
131 no_network_max_retries_ = retries;
132 }
133
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700134 int get_no_network_max_retries() { return no_network_max_retries_; }
135
Alex Deymo33e91e72015-12-01 18:26:08 -0300136 void set_server_to_check(ServerToCheck server_to_check) {
137 server_to_check_ = server_to_check;
138 }
139
Alex Deymo610277e2014-11-11 21:18:11 -0800140 size_t GetBytesDownloaded() override {
Gilad Arnold48085ba2011-11-16 09:36:08 -0800141 return static_cast<size_t>(bytes_downloaded_);
142 }
143
Alex Deymo610277e2014-11-11 21:18:11 -0800144 void set_low_speed_limit(int low_speed_bps, int low_speed_sec) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700145 low_speed_limit_bps_ = low_speed_bps;
146 low_speed_time_seconds_ = low_speed_sec;
147 }
148
Alex Deymo610277e2014-11-11 21:18:11 -0800149 void set_connect_timeout(int connect_timeout_seconds) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700150 connect_timeout_seconds_ = connect_timeout_seconds;
151 }
152
Alex Deymo610277e2014-11-11 21:18:11 -0800153 void set_max_retry_count(int max_retry_count) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700154 max_retry_count_ = max_retry_count;
155 }
156
Xiaochu Liu4a1173a2019-04-10 10:49:08 -0700157 void set_is_update_check(bool is_update_check) {
158 is_update_check_ = is_update_check;
159 }
160
rspangler@google.com49fdf182009-10-10 00:57:34 +0000161 private:
Amin Hassanid3d84212019-08-17 00:27:44 -0700162 FRIEND_TEST(LibcurlHttpFetcherTest, HostResolvedTest);
163
Alex Deymo13e95182017-03-16 19:06:13 -0700164 // libcurl's CURLOPT_CLOSESOCKETFUNCTION callback function. Called when
165 // closing a socket created with the CURLOPT_OPENSOCKETFUNCTION callback.
166 static int LibcurlCloseSocketCallback(void* clientp, curl_socket_t item);
167
Andrew de los Reyesf3ed8e72011-02-16 10:35:46 -0800168 // Callback for when proxy resolution has completed. This begins the
169 // transfer.
170 void ProxiesResolved();
Jay Srinivasan43488792012-06-19 00:25:31 -0700171
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700172 // Asks libcurl for the http response code and stores it in the object.
Amin Hassanid3d84212019-08-17 00:27:44 -0700173 virtual void GetHttpResponseCode();
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700174
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700175 // Returns the last |CURLcode|.
176 CURLcode GetCurlCode();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000177
Gilad Arnold9bedeb52011-11-17 16:19:57 -0800178 // Checks whether stored HTTP response is within the success range.
Gilad Arnold48085ba2011-11-16 09:36:08 -0800179 inline bool IsHttpResponseSuccess() {
180 return (http_response_code_ >= 200 && http_response_code_ < 300);
181 }
182
Gilad Arnold9bedeb52011-11-17 16:19:57 -0800183 // Checks whether stored HTTP response is within the error range. This
184 // includes both errors with the request (4xx) and server errors (5xx).
185 inline bool IsHttpResponseError() {
186 return (http_response_code_ >= 400 && http_response_code_ < 600);
187 }
188
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000189 // Resumes a transfer where it left off. This will use the
190 // HTTP Range: header to make a new connection from where the last
191 // left off.
192 virtual void ResumeTransfer(const std::string& url);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000193
Alex Deymo60ca1a72015-06-18 18:19:15 -0700194 void TimeoutCallback();
195 void RetryTimeoutCallback();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000196
197 // Calls into curl_multi_perform to let libcurl do its work. Returns after
198 // curl_multi_perform is finished, which may actually be after more than
Alex Deymo0b3db6b2015-08-10 15:19:37 -0700199 // one call to curl_multi_perform. This method will set up the message
Alex Deymof2858572016-02-25 11:20:13 -0800200 // loop with sources for future work that libcurl will do, if any, or complete
201 // the transfer and finish the action if no work left to do.
rspangler@google.com49fdf182009-10-10 00:57:34 +0000202 // This method will not block.
Andrew de los Reyescb319332010-07-19 10:55:01 -0700203 void CurlPerformOnce();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000204
Alex Deymo29b81532015-07-09 11:51:49 -0700205 // Sets up message loop sources as needed by libcurl. This is generally
rspangler@google.com49fdf182009-10-10 00:57:34 +0000206 // the file descriptor of the socket and a timer in case nothing happens
207 // on the fds.
Alex Deymo29b81532015-07-09 11:51:49 -0700208 void SetupMessageLoopSources();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000209
210 // Callback called by libcurl when new data has arrived on the transfer
Amin Hassani7cc8bb02019-01-14 16:29:47 -0800211 size_t LibcurlWrite(void* ptr, size_t size, size_t nmemb);
212 static size_t StaticLibcurlWrite(void* ptr,
213 size_t size,
214 size_t nmemb,
215 void* stream) {
216 return reinterpret_cast<LibcurlHttpFetcher*>(stream)->LibcurlWrite(
217 ptr, size, nmemb);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000218 }
219
220 // Cleans up the following if they are non-null:
Tianjie55abd3c2020-06-19 00:22:59 -0700221 // curl(m) handles, fd_controller_maps_(fd_task_maps_), timeout_id_.
rspangler@google.com49fdf182009-10-10 00:57:34 +0000222 void CleanUp();
223
Darin Petkov9ce452b2010-11-17 14:33:28 -0800224 // Force terminate the transfer. This will invoke the delegate's (if any)
225 // TransferTerminated callback so, after returning, this fetcher instance may
226 // be destroyed.
227 void ForceTransferTermination();
228
Jay Srinivasanb3f55402012-12-03 18:12:04 -0800229 // Sets the curl options for HTTP URL.
230 void SetCurlOptionsForHttp();
231
232 // Sets the curl options for HTTPS URL.
233 void SetCurlOptionsForHttps();
234
Alex Deymo56ccb072016-02-05 00:50:48 -0800235 // Sets the curl options for file URI.
236 void SetCurlOptionsForFile();
237
Gilad Arnold59d9e012013-07-23 16:41:43 -0700238 // Convert a proxy URL into a curl proxy type, if applicable. Returns true iff
239 // conversion was successful, false otherwise (in which case nothing is
240 // written to |out_type|).
241 bool GetProxyType(const std::string& proxy, curl_proxytype* out_type);
242
Alex Deymoc1c17b42015-11-23 03:53:15 -0300243 // Hardware interface used to query dev-mode and official build settings.
244 HardwareInterface* hardware_;
245
rspangler@google.com49fdf182009-10-10 00:57:34 +0000246 // Handles for the libcurl library
Alex Deymo60ca1a72015-06-18 18:19:15 -0700247 CURLM* curl_multi_handle_{nullptr};
248 CURL* curl_handle_{nullptr};
249 struct curl_slist* curl_http_headers_{nullptr};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000250
Alex Deymofdd6dec2016-03-03 22:35:43 -0800251 // The extra headers that will be sent on each request.
252 std::map<std::string, std::string> extra_headers_;
253
Darin Petkov60e14152010-10-27 16:57:04 -0700254 // Lists of all read(0)/write(1) file descriptors that we're waiting on from
Alex Deymo29b81532015-07-09 11:51:49 -0700255 // the message loop. libcurl may open/close descriptors and switch their
Darin Petkov60e14152010-10-27 16:57:04 -0700256 // directions so maintain two separate lists so that watch conditions can be
257 // set appropriately.
Hidehiko Abe493fecb2019-07-10 23:30:50 +0900258 std::map<int, std::unique_ptr<base::FileDescriptorWatcher::Controller>>
259 fd_controller_maps_[2];
rspangler@google.com49fdf182009-10-10 00:57:34 +0000260
Alex Deymo60ca1a72015-06-18 18:19:15 -0700261 // The TaskId of the timer we're waiting on. kTaskIdNull if we are not waiting
262 // on it.
Alex Vakulenko3f39d5c2015-10-13 09:27:13 -0700263 brillo::MessageLoop::TaskId timeout_id_{brillo::MessageLoop::kTaskIdNull};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000264
Alex Deymo29b81532015-07-09 11:51:49 -0700265 bool transfer_in_progress_{false};
Alex Deymof2858572016-02-25 11:20:13 -0800266 bool transfer_paused_{false};
267
268 // Whether it should ignore transfer failures for the purpose of retrying the
269 // connection.
270 bool ignore_failure_{false};
271
272 // Whether we should restart the transfer once Unpause() is called. This can
273 // be caused because either the connection dropped while pause or the proxy
274 // was resolved and we never started the transfer in the first place.
275 bool restart_transfer_on_unpause_{false};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000276
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000277 // The transfer size. -1 if not known.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700278 off_t transfer_size_{0};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000279
280 // How many bytes have been downloaded and sent to the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700281 off_t bytes_downloaded_{0};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000282
Gilad Arnolde4ad2502011-12-29 17:08:54 -0800283 // The remaining maximum number of bytes to download. Zero represents an
284 // unspecified length.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700285 size_t download_length_{0};
Gilad Arnolde4ad2502011-12-29 17:08:54 -0800286
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000287 // If we resumed an earlier transfer, data offset that we used for the
288 // new connection. 0 otherwise.
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700289 // In this class, resume refers to resuming a dropped HTTP connection,
290 // not to resuming an interrupted download.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700291 off_t resume_offset_{0};
Darin Petkovb83371f2010-08-17 09:34:49 -0700292
Jay Srinivasan32f23572012-06-05 13:45:07 -0700293 // Number of resumes performed so far and the max allowed.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700294 int retry_count_{0};
295 int max_retry_count_{kDownloadMaxRetryCount};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000296
Darin Petkovb83371f2010-08-17 09:34:49 -0700297 // Seconds to wait before retrying a resume.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700298 int retry_seconds_{20};
Darin Petkovb83371f2010-08-17 09:34:49 -0700299
Alex Deymob20de692017-02-05 07:47:37 +0000300 // When waiting for a retry, the task id of the retry callback.
301 brillo::MessageLoop::TaskId retry_task_id_{brillo::MessageLoop::kTaskIdNull};
302
Darin Petkova0929552010-11-29 14:19:06 -0800303 // Number of resumes due to no network (e.g., HTTP response code 0).
Alex Deymo60ca1a72015-06-18 18:19:15 -0700304 int no_network_retry_count_{0};
305 int no_network_max_retries_{0};
Darin Petkova0929552010-11-29 14:19:06 -0800306
Darin Petkovb83371f2010-08-17 09:34:49 -0700307 // Seconds to wait before asking libcurl to "perform".
Alex Deymo60ca1a72015-06-18 18:19:15 -0700308 int idle_seconds_{1};
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700309
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700310 // If true, we are currently performing a write callback on the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700311 bool in_write_callback_{false};
Darin Petkova0929552010-11-29 14:19:06 -0800312
Andrew de los Reyes45168102010-11-22 11:13:50 -0800313 // If true, we have returned at least one byte in the write callback
314 // to the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700315 bool sent_byte_{false};
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700316
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700317 // We can't clean everything up while we're in a write callback, so
318 // if we get a terminate request, queue it until we can handle it.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700319 bool terminate_requested_{false};
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700320
Alex Deymo33e91e72015-12-01 18:26:08 -0300321 // The ServerToCheck used when checking this connection's certificate. If no
322 // certificate check needs to be performed, this should be set to
323 // ServerToCheck::kNone.
324 ServerToCheck server_to_check_{ServerToCheck::kNone};
Bruno Rocha7f9aea22011-09-12 14:31:24 -0700325
Xiaochu Liu4a1173a2019-04-10 10:49:08 -0700326 // True if this object is for update check.
327 bool is_update_check_{false};
328
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700329 // Internal state machine.
330 UnresolvedHostStateMachine unresolved_host_state_machine_;
331
Alex Deymo60ca1a72015-06-18 18:19:15 -0700332 int low_speed_limit_bps_{kDownloadLowSpeedLimitBps};
333 int low_speed_time_seconds_{kDownloadLowSpeedTimeSeconds};
334 int connect_timeout_seconds_{kDownloadConnectTimeoutSeconds};
David Zeuthen34135a92013-08-06 11:16:16 -0700335
rspangler@google.com49fdf182009-10-10 00:57:34 +0000336 DISALLOW_COPY_AND_ASSIGN(LibcurlHttpFetcher);
337};
338
339} // namespace chromeos_update_engine
340
Alex Deymo14c0da82016-07-20 16:45:45 -0700341#endif // UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_