HTTPClient.cpp 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299
  1. // Copyright (c) Kuba Szczodrzyński 2021-12-21.
  2. #include "HTTPClient.h"
  3. #include "TCPSocket.h"
  4. using namespace bell;
  5. void HTTPClient::HTTPResponse::close() {
  6. socket = nullptr;
  7. if (buf)
  8. free(buf);
  9. buf = nullptr;
  10. bufPtr = nullptr;
  11. }
  12. HTTPClient::HTTPResponse::~HTTPResponse() {
  13. socket = nullptr;
  14. if (buf)
  15. free(buf);
  16. }
  17. HTTPResponse_t HTTPClient::execute(const struct HTTPRequest &request) {
  18. auto response = std::make_unique<HTTPResponse>();
  19. response->dumpFs = request.dumpFs;
  20. response->dumpRawFs = request.dumpRawFs;
  21. return HTTPClient::executeImpl(request, std::move(response));
  22. }
  23. HTTPResponse_t HTTPClient::executeImpl(const struct HTTPRequest &request, HTTPResponse_t response) {
  24. const char *url = request.url.c_str();
  25. if (response->isRedirect) {
  26. url = response->location.c_str();
  27. }
  28. bool https = url[4] == 's';
  29. uint16_t port = https ? 443 : 80;
  30. auto *hostname = url + (https ? 8 : 7);
  31. auto *hostnameEnd = strchr(hostname, ':');
  32. auto *path = strchr(hostname, '/');
  33. if (hostnameEnd == nullptr) {
  34. hostnameEnd = path;
  35. } else {
  36. port = strtol(hostnameEnd + 1, nullptr, 10);
  37. }
  38. auto hostnameStr = std::string(hostname, (const char *)hostnameEnd);
  39. if (https) {
  40. response->socket = std::make_shared<TLSSocket>();
  41. } else {
  42. response->socket = std::make_shared<TCPSocket>();
  43. }
  44. response->socket->open(hostnameStr, port);
  45. const char *endl = "\r\n";
  46. std::stringstream stream;
  47. switch (request.method) {
  48. case HTTPMethod::GET:
  49. stream << "GET ";
  50. break;
  51. case HTTPMethod::POST:
  52. stream << "POST ";
  53. break;
  54. }
  55. stream << path << " HTTP/1.1" << endl;
  56. stream << "Host: " << hostnameStr << ":" << port << endl;
  57. stream << "Accept: */*" << endl;
  58. if (request.body != nullptr) {
  59. stream << "Content-Type: " << request.contentType << endl;
  60. stream << "Content-Length: " << strlen(request.body) << endl;
  61. }
  62. for (const auto &header : request.headers) {
  63. stream << header.first << ": " << header.second << endl;
  64. }
  65. stream << endl;
  66. stream << request.body;
  67. std::string data = stream.str();
  68. size_t len = response->socket->write((uint8_t *)data.c_str(), data.size());
  69. if (len != data.size()) {
  70. response->close();
  71. BELL_LOG(error, "http", "Writing failed: wrote %d of %d bytes", len, data.size());
  72. return nullptr;
  73. }
  74. response->readHeaders();
  75. if (response->isRedirect && (request.maxRedirects < 0 || response->redirectCount < request.maxRedirects)) {
  76. response->redirectCount++;
  77. response->close(); // close the previous socket
  78. return HTTPClient::executeImpl(request, std::move(response));
  79. }
  80. return response;
  81. }
  82. bool HTTPClient::readHeader(const char *&header, const char *name) {
  83. size_t len = strlen(name);
  84. if (strncasecmp(header, name, len) == 0) {
  85. header += len;
  86. while (*header == ' ')
  87. header++;
  88. return true;
  89. }
  90. return false;
  91. }
  92. size_t HTTPClient::HTTPResponse::readRaw(char *dst) {
  93. size_t len = this->socket->read((uint8_t *)dst, BUF_SIZE);
  94. if (dumpRawFs)
  95. dumpRawFs->write(dst, (long)len);
  96. // BELL_LOG(debug, "http", "Read %d bytes", len);
  97. dst[len] = '\0';
  98. return len;
  99. }
  100. void HTTPClient::HTTPResponse::readHeaders() {
  101. size_t len;
  102. char *line, *lineEnd;
  103. bool complete = false;
  104. std::string lineBuf;
  105. if (this->buf == nullptr) { // allocate a buffer
  106. this->buf = static_cast<char *>(malloc(BUF_SIZE + 1));
  107. this->bufPtr = this->buf;
  108. }
  109. // reset everything after a redirect
  110. this->statusCode = 0;
  111. this->contentLength = 0;
  112. this->isChunked = false;
  113. this->isGzip = false;
  114. this->isComplete = false;
  115. this->isRedirect = false;
  116. this->isStreaming = false;
  117. do {
  118. len = this->readRaw(this->buf);
  119. line = this->buf;
  120. do {
  121. lineEnd = strstr(line, "\r\n");
  122. if (!lineEnd) {
  123. lineBuf += std::string(line, this->buf + len);
  124. break;
  125. }
  126. lineBuf += std::string(line, lineEnd);
  127. if (lineBuf.empty()) {
  128. complete = true;
  129. // if body is present in buf, move the reading pointer
  130. if (lineEnd + 2 < this->buf + len) {
  131. this->bufPtr = lineEnd + 2;
  132. this->bufRemaining = len - (this->bufPtr - this->buf);
  133. this->isStreaming =
  134. !this->isComplete && !this->contentLength && (len < BUF_SIZE || this->socket->poll() == 0);
  135. }
  136. break;
  137. }
  138. auto *header = lineBuf.c_str();
  139. if (strncmp(header, "HTTP/", 5) == 0) {
  140. header += 9; // skip "1.1 "
  141. this->statusCode = strtol(header, nullptr, 10);
  142. } else if (readHeader(header, "content-type:")) {
  143. this->contentType = std::string(header);
  144. } else if (readHeader(header, "content-length:")) {
  145. this->contentLength = strtol(header, nullptr, 10);
  146. if (!this->contentLength)
  147. this->isComplete = true; // forbid reading of the body
  148. } else if (readHeader(header, "transfer-encoding:")) {
  149. this->isChunked = strncmp(header, "chunked", 7) == 0;
  150. } else if (readHeader(header, "location:")) {
  151. this->isRedirect = true;
  152. this->location = std::string(header);
  153. } else {
  154. auto *colonPtr = strchr((char *)header, ':');
  155. if (colonPtr) {
  156. auto *valuePtr = colonPtr + 1;
  157. while (*valuePtr == ' ')
  158. valuePtr++;
  159. *colonPtr = '\0';
  160. for (auto *p = (char *)header; *p; ++p) // convert header name to lower case
  161. *p = (char)tolower(*p);
  162. this->headers[std::string(header)] = std::string(valuePtr);
  163. }
  164. }
  165. lineBuf.clear();
  166. line = lineEnd + 2; // skip \r\n
  167. } while (true);
  168. } while (!complete && len); // if len == 0, the connection is closed
  169. }
  170. bool HTTPClient::HTTPResponse::skipRaw(size_t len, bool dontRead) {
  171. size_t skip = 0;
  172. if (len > bufRemaining) {
  173. skip = len - bufRemaining;
  174. len = bufRemaining;
  175. }
  176. bufRemaining -= len;
  177. bufPtr += len;
  178. if (!bufRemaining && !dontRead) { // don't read more data after a chunk's \r\n
  179. if (isComplete || (contentLength && bodyRead >= contentLength && !chunkRemaining)) {
  180. isComplete = true;
  181. return false;
  182. }
  183. bufRemaining = this->readRaw(this->buf);
  184. if (!bufRemaining)
  185. return false; // if len == 0, the connection is closed
  186. bufPtr = this->buf + skip;
  187. bufRemaining -= skip;
  188. if (!contentLength && bufRemaining < BUF_SIZE) {
  189. // no content length set and the TCP buffer is not yielding more data, yet
  190. isStreaming = true;
  191. }
  192. }
  193. return true;
  194. }
// Reads up to `toRead` bytes of the response body, decoding chunked transfer encoding
// when isChunked is set.
//
// dst    - destination for the body bytes; when null, the data is consumed and counted
//          but not copied anywhere.
// toRead - maximum number of body bytes to produce in this call.
// wait   - when false and the response is treated as a stream, the call returns as soon
//          as the buffer runs empty instead of looping for more data.
//
// Returns the number of body bytes consumed; 0 once the body has been marked complete.
// The bytes are also written to dumpFs when it is set and `dst` is non-null.
size_t HTTPClient::HTTPResponse::read(char *dst, size_t toRead, bool wait) {
    if (isComplete) {
        // end of chunked stream was found OR complete body was read
        return 0;
    }
    auto *dstStart = dst ? dst : nullptr; // remember where the output began, for the dump below
    size_t read = 0;
    while (toRead) { // this loop ends after original toRead
        skipRaw(0); // ensure the buffer contains data, wait if necessary
        if (isChunked && !chunkRemaining) {
            // at a chunk boundary: bufPtr is expected to point at the next chunk-size line
            if (*bufPtr == '0') { // all chunks were read *and emitted*
                isComplete = true;
                break;
            }
            auto *endPtr = bufPtr;
            if (strchr(bufPtr, '\r') == nullptr) { // buf doesn't contain complete chunk size
                auto size = std::string(bufPtr, bufPtr + bufRemaining); // take the rest of the buffer
                if (!skipRaw(bufRemaining)) // skip the rest, read another buf
                    break; // -> no more data
                endPtr = strchr(bufPtr, '\r'); // find the end of the actual number
                if (endPtr == nullptr) // something's wrong
                    break; // - give up
                size += std::string(bufPtr, endPtr); // append the newly read size
                chunkRemaining = std::stoul(size, nullptr, 16); // read the hex size
            } else {
                chunkRemaining = strtol(bufPtr, &endPtr, 16); // read the hex size
            }
            if (!skipRaw(endPtr - bufPtr + 2)) // skip the size and \r\n
                break; // -> no more data, break out of main loop
        } else if (contentLength && !chunkRemaining) {
            // non-chunked body with a known length: treat the whole body as one chunk
            chunkRemaining = contentLength;
        }
        while (chunkRemaining && toRead) {
            // copy no more than the caller asked for, the buffer holds, or the chunk has left
            size_t count = std::min(toRead, std::min(bufRemaining, chunkRemaining));
            if (dst) {
                memcpy(dst, bufPtr, count);
                dst += count; // move the dst pointer
            }
            read += count; // increment read counter
            bodyRead += count; // increment total response size
            chunkRemaining -= count; // decrease chunk remaining size
            toRead -= count; // decrease local remaining size
            if (!skipRaw(count)) { // eat some buffer
                toRead = 0; // -> no more data, break out of main loop
                break;
            }
            if (isChunked && !chunkRemaining) { // bufPtr is on the end of chunk
                if (!skipRaw(2, isStreaming)) // skip the \r\n for chunked encoding
                    toRead = 0; // -> no more data, break out of main loop
                if (bufRemaining > 1 && bufPtr[0] == '0' && bufPtr[1] == '\r') // this is the last chunk
                    isComplete = true;
            }
        }
        if (isStreaming && !bufRemaining && !wait) { // stream with no buffer available, just yield the current chunk
            break;
        }
    }
    if (!isChunked && contentLength && !chunkRemaining)
        isComplete = true; // entire response was read
    if (dumpFs && dstStart)
        dumpFs->write(dstStart, (long)read);
    // BELL_LOG(debug, "http", "Read %d of %d bytes", bodyRead, contentLength);
    return read;
}
  259. std::string HTTPClient::HTTPResponse::readToString() {
  260. if (this->contentLength) {
  261. std::string result(this->contentLength, '\0');
  262. auto *data = result.data();
  263. auto len = this->read(data, this->contentLength);
  264. data[len] = '\0';
  265. this->close();
  266. return result;
  267. }
  268. std::string result;
  269. char buffer[BUF_SIZE+1]; // make space for null-terminator
  270. size_t len;
  271. do {
  272. len = this->read(buffer, BUF_SIZE);
  273. buffer[len] = '\0';
  274. result += std::string(buffer);
  275. } while (len);
  276. this->close();
  277. return result;
  278. }