blob: 0e34f9d2cf17c56b7f1725755afc7730605f1798 [file] [log] [blame]
//
// Copyright (C) 2009 The Android Open Source Project
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
rspangler@google.com49fdf182009-10-10 00:57:34 +000016
Alex Deymo14c0da82016-07-20 16:45:45 -070017#ifndef UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_
18#define UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_
rspangler@google.com49fdf182009-10-10 00:57:34 +000019
20#include <map>
Alex Deymoc1c17b42015-11-23 03:53:15 -030021#include <memory>
rspangler@google.com49fdf182009-10-10 00:57:34 +000022#include <string>
Alex Vakulenkod2779df2014-06-16 13:19:00 -070023#include <utility>
Bruno Rocha7f9aea22011-09-12 14:31:24 -070024
rspangler@google.com49fdf182009-10-10 00:57:34 +000025#include <curl/curl.h>
Bruno Rocha7f9aea22011-09-12 14:31:24 -070026
Hidehiko Abe493fecb2019-07-10 23:30:50 +090027#include <base/files/file_descriptor_watcher_posix.h>
Ben Chan05735a12014-09-03 07:48:22 -070028#include <base/logging.h>
29#include <base/macros.h>
Alex Vakulenko3f39d5c2015-10-13 09:27:13 -070030#include <brillo/message_loops/message_loop.h>
Ben Chan05735a12014-09-03 07:48:22 -070031
Alex Deymo14c0da82016-07-20 16:45:45 -070032#include "update_engine/certificate_checker.h"
Alex Deymo39910dc2015-11-09 17:04:30 -080033#include "update_engine/common/hardware_interface.h"
34#include "update_engine/common/http_fetcher.h"
Jay Srinivasan43488792012-06-19 00:25:31 -070035
// This is a concrete implementation of HttpFetcher that uses libcurl to do the
// HTTP work.
38
39namespace chromeos_update_engine {
40
// |UnresolvedHostStateMachine| is a representation of the internal state
// machine that |LibcurlHttpFetcher| keeps for unresolved-host handling. It
// starts in |State::kInit| and is advanced through |UpdateState()|.
class UnresolvedHostStateMachine {
 public:
  // States of the machine; see the diagram on |UpdateState()| for the
  // transitions between them.
  enum class State {
    kInit = 0,
    kRetry = 1,
    kRetriedSuccess = 2,
    kNotRetry = 3,
  };

  UnresolvedHostStateMachine() = default;

  // Not copyable or assignable.
  UnresolvedHostStateMachine(const UnresolvedHostStateMachine&) = delete;
  UnresolvedHostStateMachine& operator=(const UnresolvedHostStateMachine&) =
      delete;

  // Returns the current state. Read-only, so it is callable on const objects.
  State GetState() const { return state_; }

  // Updates the following internal state machine:
  //
  // |kInit|
  //   |
  //   |
  //   \/
  // (Try, host Unresolved)
  //   |
  //   |
  //   \/
  // |kRetry| --> (Retry, host resolved)
  //   |                     |
  //   |                     |
  //   \/                    \/
  // (Retry, host Unresolved)   |kRetriedSuccess|
  //   |
  //   |
  //   \/
  // |kNotRetry|
  //
  // NOTE(review): |failed_to_resolve_host| is presumably true when the latest
  // attempt could not resolve the host; the definition lives outside this
  // header, so confirm against the implementation.
  void UpdateState(bool failed_to_resolve_host);

 private:
  // Current state; a freshly constructed machine is in |State::kInit|.
  State state_{State::kInit};
};
82
rspangler@google.com49fdf182009-10-10 00:57:34 +000083class LibcurlHttpFetcher : public HttpFetcher {
84 public:
Daniel Zheng0c1648c2023-04-12 10:57:44 -070085 explicit LibcurlHttpFetcher(HardwareInterface* hardware);
rspangler@google.com49fdf182009-10-10 00:57:34 +000086
87 // Cleans up all internal state. Does not notify delegate
Alex Deymo610277e2014-11-11 21:18:11 -080088 ~LibcurlHttpFetcher() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +000089
Alex Deymo610277e2014-11-11 21:18:11 -080090 void SetOffset(off_t offset) override { bytes_downloaded_ = offset; }
Gilad Arnolde4ad2502011-12-29 17:08:54 -080091
Alex Deymo610277e2014-11-11 21:18:11 -080092 void SetLength(size_t length) override { download_length_ = length; }
93 void UnsetLength() override { SetLength(0); }
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -070094
rspangler@google.com49fdf182009-10-10 00:57:34 +000095 // Begins the transfer if it hasn't already begun.
Alex Deymo610277e2014-11-11 21:18:11 -080096 void BeginTransfer(const std::string& url) override;
rspangler@google.com49fdf182009-10-10 00:57:34 +000097
Darin Petkov9ce452b2010-11-17 14:33:28 -080098 // If the transfer is in progress, aborts the transfer early. The transfer
99 // cannot be resumed.
Alex Deymo610277e2014-11-11 21:18:11 -0800100 void TerminateTransfer() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000101
Alex Deymofdd6dec2016-03-03 22:35:43 -0800102 // Pass the headers to libcurl.
103 void SetHeader(const std::string& header_name,
104 const std::string& header_value) override;
105
Jae Hoon Kim0ae8fe12019-06-26 14:32:50 -0700106 bool GetHeader(const std::string& header_name,
107 std::string* header_value) const override;
108
rspangler@google.com49fdf182009-10-10 00:57:34 +0000109 // Suspend the transfer by calling curl_easy_pause(CURLPAUSE_ALL).
Alex Deymo610277e2014-11-11 21:18:11 -0800110 void Pause() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000111
112 // Resume the transfer by calling curl_easy_pause(CURLPAUSE_CONT).
Alex Deymo610277e2014-11-11 21:18:11 -0800113 void Unpause() override;
rspangler@google.com49fdf182009-10-10 00:57:34 +0000114
115 // Libcurl sometimes asks to be called back after some time while
116 // leaving that time unspecified. In that case, we pick a reasonable
117 // default of one second, but it can be overridden here. This is
118 // primarily useful for testing.
119 // From http://curl.haxx.se/libcurl/c/curl_multi_timeout.html:
120 // if libcurl returns a -1 timeout here, it just means that libcurl
121 // currently has no stored timeout value. You must not wait too long
122 // (more than a few seconds perhaps) before you call
123 // curl_multi_perform() again.
Alex Deymo610277e2014-11-11 21:18:11 -0800124 void set_idle_seconds(int seconds) override { idle_seconds_ = seconds; }
Darin Petkovb83371f2010-08-17 09:34:49 -0700125
126 // Sets the retry timeout. Useful for testing.
Alex Deymo610277e2014-11-11 21:18:11 -0800127 void set_retry_seconds(int seconds) override { retry_seconds_ = seconds; }
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700128
Darin Petkova0929552010-11-29 14:19:06 -0800129 void set_no_network_max_retries(int retries) {
130 no_network_max_retries_ = retries;
131 }
132
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700133 int get_no_network_max_retries() { return no_network_max_retries_; }
134
Alex Deymo33e91e72015-12-01 18:26:08 -0300135 void set_server_to_check(ServerToCheck server_to_check) {
136 server_to_check_ = server_to_check;
137 }
138
Alex Deymo610277e2014-11-11 21:18:11 -0800139 size_t GetBytesDownloaded() override {
Gilad Arnold48085ba2011-11-16 09:36:08 -0800140 return static_cast<size_t>(bytes_downloaded_);
141 }
142
Alex Deymo610277e2014-11-11 21:18:11 -0800143 void set_low_speed_limit(int low_speed_bps, int low_speed_sec) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700144 low_speed_limit_bps_ = low_speed_bps;
145 low_speed_time_seconds_ = low_speed_sec;
146 }
147
Alex Deymo610277e2014-11-11 21:18:11 -0800148 void set_connect_timeout(int connect_timeout_seconds) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700149 connect_timeout_seconds_ = connect_timeout_seconds;
150 }
151
Alex Deymo610277e2014-11-11 21:18:11 -0800152 void set_max_retry_count(int max_retry_count) override {
David Zeuthen34135a92013-08-06 11:16:16 -0700153 max_retry_count_ = max_retry_count;
154 }
155
Xiaochu Liu4a1173a2019-04-10 10:49:08 -0700156 void set_is_update_check(bool is_update_check) {
157 is_update_check_ = is_update_check;
158 }
159
rspangler@google.com49fdf182009-10-10 00:57:34 +0000160 private:
Amin Hassanid3d84212019-08-17 00:27:44 -0700161 FRIEND_TEST(LibcurlHttpFetcherTest, HostResolvedTest);
162
Alex Deymo13e95182017-03-16 19:06:13 -0700163 // libcurl's CURLOPT_CLOSESOCKETFUNCTION callback function. Called when
164 // closing a socket created with the CURLOPT_OPENSOCKETFUNCTION callback.
165 static int LibcurlCloseSocketCallback(void* clientp, curl_socket_t item);
166
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700167 // Asks libcurl for the http response code and stores it in the object.
Amin Hassanid3d84212019-08-17 00:27:44 -0700168 virtual void GetHttpResponseCode();
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700169
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700170 // Returns the last |CURLcode|.
171 CURLcode GetCurlCode();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000172
Gilad Arnold9bedeb52011-11-17 16:19:57 -0800173 // Checks whether stored HTTP response is within the success range.
Gilad Arnold48085ba2011-11-16 09:36:08 -0800174 inline bool IsHttpResponseSuccess() {
175 return (http_response_code_ >= 200 && http_response_code_ < 300);
176 }
177
Gilad Arnold9bedeb52011-11-17 16:19:57 -0800178 // Checks whether stored HTTP response is within the error range. This
179 // includes both errors with the request (4xx) and server errors (5xx).
180 inline bool IsHttpResponseError() {
181 return (http_response_code_ >= 400 && http_response_code_ < 600);
182 }
183
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000184 // Resumes a transfer where it left off. This will use the
185 // HTTP Range: header to make a new connection from where the last
186 // left off.
187 virtual void ResumeTransfer(const std::string& url);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000188
Alex Deymo60ca1a72015-06-18 18:19:15 -0700189 void TimeoutCallback();
190 void RetryTimeoutCallback();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000191
192 // Calls into curl_multi_perform to let libcurl do its work. Returns after
193 // curl_multi_perform is finished, which may actually be after more than
Alex Deymo0b3db6b2015-08-10 15:19:37 -0700194 // one call to curl_multi_perform. This method will set up the message
Alex Deymof2858572016-02-25 11:20:13 -0800195 // loop with sources for future work that libcurl will do, if any, or complete
196 // the transfer and finish the action if no work left to do.
rspangler@google.com49fdf182009-10-10 00:57:34 +0000197 // This method will not block.
Andrew de los Reyescb319332010-07-19 10:55:01 -0700198 void CurlPerformOnce();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000199
Alex Deymo29b81532015-07-09 11:51:49 -0700200 // Sets up message loop sources as needed by libcurl. This is generally
rspangler@google.com49fdf182009-10-10 00:57:34 +0000201 // the file descriptor of the socket and a timer in case nothing happens
202 // on the fds.
Alex Deymo29b81532015-07-09 11:51:49 -0700203 void SetupMessageLoopSources();
rspangler@google.com49fdf182009-10-10 00:57:34 +0000204
205 // Callback called by libcurl when new data has arrived on the transfer
Amin Hassani7cc8bb02019-01-14 16:29:47 -0800206 size_t LibcurlWrite(void* ptr, size_t size, size_t nmemb);
207 static size_t StaticLibcurlWrite(void* ptr,
208 size_t size,
209 size_t nmemb,
210 void* stream) {
211 return reinterpret_cast<LibcurlHttpFetcher*>(stream)->LibcurlWrite(
212 ptr, size, nmemb);
rspangler@google.com49fdf182009-10-10 00:57:34 +0000213 }
214
215 // Cleans up the following if they are non-null:
Tianjie55abd3c2020-06-19 00:22:59 -0700216 // curl(m) handles, fd_controller_maps_(fd_task_maps_), timeout_id_.
rspangler@google.com49fdf182009-10-10 00:57:34 +0000217 void CleanUp();
218
Darin Petkov9ce452b2010-11-17 14:33:28 -0800219 // Force terminate the transfer. This will invoke the delegate's (if any)
220 // TransferTerminated callback so, after returning, this fetcher instance may
221 // be destroyed.
222 void ForceTransferTermination();
223
Jay Srinivasanb3f55402012-12-03 18:12:04 -0800224 // Sets the curl options for HTTP URL.
225 void SetCurlOptionsForHttp();
226
227 // Sets the curl options for HTTPS URL.
228 void SetCurlOptionsForHttps();
229
Alex Deymo56ccb072016-02-05 00:50:48 -0800230 // Sets the curl options for file URI.
231 void SetCurlOptionsForFile();
232
Gilad Arnold59d9e012013-07-23 16:41:43 -0700233 // Convert a proxy URL into a curl proxy type, if applicable. Returns true iff
234 // conversion was successful, false otherwise (in which case nothing is
235 // written to |out_type|).
236 bool GetProxyType(const std::string& proxy, curl_proxytype* out_type);
237
Alex Deymoc1c17b42015-11-23 03:53:15 -0300238 // Hardware interface used to query dev-mode and official build settings.
239 HardwareInterface* hardware_;
240
rspangler@google.com49fdf182009-10-10 00:57:34 +0000241 // Handles for the libcurl library
Alex Deymo60ca1a72015-06-18 18:19:15 -0700242 CURLM* curl_multi_handle_{nullptr};
243 CURL* curl_handle_{nullptr};
244 struct curl_slist* curl_http_headers_{nullptr};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000245
Alex Deymofdd6dec2016-03-03 22:35:43 -0800246 // The extra headers that will be sent on each request.
247 std::map<std::string, std::string> extra_headers_;
248
Darin Petkov60e14152010-10-27 16:57:04 -0700249 // Lists of all read(0)/write(1) file descriptors that we're waiting on from
Alex Deymo29b81532015-07-09 11:51:49 -0700250 // the message loop. libcurl may open/close descriptors and switch their
Darin Petkov60e14152010-10-27 16:57:04 -0700251 // directions so maintain two separate lists so that watch conditions can be
252 // set appropriately.
Hidehiko Abe493fecb2019-07-10 23:30:50 +0900253 std::map<int, std::unique_ptr<base::FileDescriptorWatcher::Controller>>
254 fd_controller_maps_[2];
rspangler@google.com49fdf182009-10-10 00:57:34 +0000255
Alex Deymo60ca1a72015-06-18 18:19:15 -0700256 // The TaskId of the timer we're waiting on. kTaskIdNull if we are not waiting
257 // on it.
Alex Vakulenko3f39d5c2015-10-13 09:27:13 -0700258 brillo::MessageLoop::TaskId timeout_id_{brillo::MessageLoop::kTaskIdNull};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000259
Alex Deymo29b81532015-07-09 11:51:49 -0700260 bool transfer_in_progress_{false};
Alex Deymof2858572016-02-25 11:20:13 -0800261 bool transfer_paused_{false};
262
263 // Whether it should ignore transfer failures for the purpose of retrying the
264 // connection.
265 bool ignore_failure_{false};
266
267 // Whether we should restart the transfer once Unpause() is called. This can
268 // be caused because either the connection dropped while pause or the proxy
269 // was resolved and we never started the transfer in the first place.
270 bool restart_transfer_on_unpause_{false};
rspangler@google.com49fdf182009-10-10 00:57:34 +0000271
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000272 // The transfer size. -1 if not known.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700273 off_t transfer_size_{0};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000274
275 // How many bytes have been downloaded and sent to the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700276 off_t bytes_downloaded_{0};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000277
Gilad Arnolde4ad2502011-12-29 17:08:54 -0800278 // The remaining maximum number of bytes to download. Zero represents an
279 // unspecified length.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700280 size_t download_length_{0};
Gilad Arnolde4ad2502011-12-29 17:08:54 -0800281
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000282 // If we resumed an earlier transfer, data offset that we used for the
283 // new connection. 0 otherwise.
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700284 // In this class, resume refers to resuming a dropped HTTP connection,
285 // not to resuming an interrupted download.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700286 off_t resume_offset_{0};
Darin Petkovb83371f2010-08-17 09:34:49 -0700287
Jay Srinivasan32f23572012-06-05 13:45:07 -0700288 // Number of resumes performed so far and the max allowed.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700289 int retry_count_{0};
290 int max_retry_count_{kDownloadMaxRetryCount};
adlr@google.comc98a7ed2009-12-04 18:54:03 +0000291
Darin Petkovb83371f2010-08-17 09:34:49 -0700292 // Seconds to wait before retrying a resume.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700293 int retry_seconds_{20};
Darin Petkovb83371f2010-08-17 09:34:49 -0700294
Alex Deymob20de692017-02-05 07:47:37 +0000295 // When waiting for a retry, the task id of the retry callback.
296 brillo::MessageLoop::TaskId retry_task_id_{brillo::MessageLoop::kTaskIdNull};
297
Darin Petkova0929552010-11-29 14:19:06 -0800298 // Number of resumes due to no network (e.g., HTTP response code 0).
Alex Deymo60ca1a72015-06-18 18:19:15 -0700299 int no_network_retry_count_{0};
300 int no_network_max_retries_{0};
Darin Petkova0929552010-11-29 14:19:06 -0800301
Darin Petkovb83371f2010-08-17 09:34:49 -0700302 // Seconds to wait before asking libcurl to "perform".
Alex Deymo60ca1a72015-06-18 18:19:15 -0700303 int idle_seconds_{1};
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700304
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700305 // If true, we are currently performing a write callback on the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700306 bool in_write_callback_{false};
Darin Petkova0929552010-11-29 14:19:06 -0800307
Andrew de los Reyes45168102010-11-22 11:13:50 -0800308 // If true, we have returned at least one byte in the write callback
309 // to the delegate.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700310 bool sent_byte_{false};
Darin Petkovfc7a0ce2010-10-25 10:38:37 -0700311
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700312 // We can't clean everything up while we're in a write callback, so
313 // if we get a terminate request, queue it until we can handle it.
Alex Deymo60ca1a72015-06-18 18:19:15 -0700314 bool terminate_requested_{false};
Andrew de los Reyes3fd5d302010-10-07 20:07:18 -0700315
Alex Deymo33e91e72015-12-01 18:26:08 -0300316 // The ServerToCheck used when checking this connection's certificate. If no
317 // certificate check needs to be performed, this should be set to
318 // ServerToCheck::kNone.
319 ServerToCheck server_to_check_{ServerToCheck::kNone};
Bruno Rocha7f9aea22011-09-12 14:31:24 -0700320
Xiaochu Liu4a1173a2019-04-10 10:49:08 -0700321 // True if this object is for update check.
322 bool is_update_check_{false};
323
Xiaochu Liub5ba7972019-07-11 09:51:06 -0700324 // Internal state machine.
325 UnresolvedHostStateMachine unresolved_host_state_machine_;
326
Alex Deymo60ca1a72015-06-18 18:19:15 -0700327 int low_speed_limit_bps_{kDownloadLowSpeedLimitBps};
328 int low_speed_time_seconds_{kDownloadLowSpeedTimeSeconds};
329 int connect_timeout_seconds_{kDownloadConnectTimeoutSeconds};
David Zeuthen34135a92013-08-06 11:16:16 -0700330
rspangler@google.com49fdf182009-10-10 00:57:34 +0000331 DISALLOW_COPY_AND_ASSIGN(LibcurlHttpFetcher);
332};
333
334} // namespace chromeos_update_engine
335
Alex Deymo14c0da82016-07-20 16:45:45 -0700336#endif // UPDATE_ENGINE_LIBCURL_HTTP_FETCHER_H_