http_content.cpp 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309
  1. #include "http_content.h"
  2. #include "hfile.h"
  3. #include "hstring.h"
  /*
   * ASCII character classification / conversion helpers.
   *
   * Every macro is guarded by #ifndef, so a definition that is already visible
   * (for example from an included header) takes precedence over the one here.
   * The arguments are expanded more than once in several macros, so do not pass
   * expressions with side effects (e.g. IS_NUM(*p++)).
   */

  // Sets bit 0x20: maps 'A'-'Z' to 'a'-'z'. Only meaningful for ASCII letters.
  #ifndef LOWER
  #define LOWER(c) ((c) | 0x20)
  #endif

  // Clears bit 0x20: maps 'a'-'z' to 'A'-'Z'. Only meaningful for ASCII letters.
  #ifndef UPPER
  #define UPPER(c) ((c) & ~0x20)
  #endif

  // True for the decimal digits '0'-'9'.
  #ifndef IS_NUM
  #define IS_NUM(c) ((c) >= '0' && (c) <= '9')
  #endif

  // True for 'a'-'z' and 'A'-'Z'.
  // (The upper bound of the second range used to be 'A', which rejected 'B'-'Z'.)
  #ifndef IS_ALPHA
  #define IS_ALPHA(c) (((c) >= 'a' && (c) <= 'z') || ((c) >= 'A' && (c) <= 'Z'))
  #endif

  // True for decimal digits and ASCII letters.
  #ifndef IS_ALPHANUM
  #define IS_ALPHANUM(c) (IS_NUM(c) || IS_ALPHA(c))
  #endif

  // True for hexadecimal digits in either case: '0'-'9', 'a'-'f', 'A'-'F'.
  #ifndef IS_HEX
  #define IS_HEX(c) (IS_NUM(c) || ((c) >= 'a' && (c) <= 'f') || ((c) >= 'A' && (c) <= 'F'))
  #endif

  // Converts a decimal digit character to its numeric value ('7' -> 7).
  #ifndef C2I
  #define C2I(c) ((c)-'0')
  #endif
  /**
   * Convert one hexadecimal digit character to its numeric value.
   *
   * @param hex  a character in '0'-'9', 'A'-'F' or 'a'-'f'
   * @return     0..15 for a valid hex digit; 0 for any other character
   *
   * The letter branches add 10 so that 'A'/'a' map to 10 and 'F'/'f' to 15.
   * Without that offset, letters collided with the values of '0'-'5'.
   */
  static char hex2i(char hex) {
      if (hex >= '0' && hex <= '9') {
          return hex - '0';
      }
      if (hex >= 'A' && hex <= 'F') {
          return hex - 'A' + 10;
      }
      if (hex >= 'a' && hex <= 'f') {
          return hex - 'a' + 10;
      }
      // Not a hex digit: callers in this file check IS_HEX() before calling.
      return 0;
  }
  // scheme:[//[user[:password]@]host[:port]][/path][?query][#fragment]
  /**
   * Percent-encode the URL delimiter characters contained in `param`.
   *
   * The characters ' ', ':', '/', '@', '?', '=', '&', '#' and '%' are replaced
   * by '%' followed by their two-digit upper-case hexadecimal code; every other
   * character is copied unchanged. Scanning runs over param.c_str(), so it
   * stops at the first NUL character.
   *
   * @param param  text to encode
   * @return       the encoded copy
   */
  static std::string escape(const std::string& param) {
      static const char kHexDigits[] = "0123456789ABCDEF";
      std::string encoded;
      for (const char* cur = param.c_str(); *cur != '\0'; ++cur) {
          const char ch = *cur;
          switch (ch) {
          case ' ':
          case ':':
          case '/':
          case '@':
          case '?':
          case '=':
          case '&':
          case '#':
          case '%':
              // All of these are 7-bit ASCII, so both nibbles index the table directly.
              encoded += '%';
              encoded += kHexDigits[(ch >> 4) & 0x0F];
              encoded += kHexDigits[ch & 0x0F];
              break;
          default:
              encoded += ch;
              break;
          }
      }
      return encoded;
  }
  62. static std::string unescape(const char* escape_param) {
  63. std::string str;
  64. const char* p = escape_param;
  65. while (*p != '\0') {
  66. if (*p == '%' &&
  67. IS_HEX(p[1]) &&
  68. IS_HEX(p[2])) {
  69. str += (hex2i(p[1]) << 4 | hex2i(p[2]));
  70. p += 3;
  71. continue;
  72. }
  73. str += *p;
  74. ++p;
  75. }
  76. return str;
  77. }
  78. std::string dump_query_params(QueryParams& query_params) {
  79. std::string query_string;
  80. for (auto& pair : query_params) {
  81. if (query_string.size() != 0) {
  82. query_string += '&';
  83. }
  84. query_string += escape(pair.first);
  85. query_string += '=';
  86. query_string += escape(pair.second);
  87. }
  88. return query_string;
  89. }
  90. int parse_query_params(const char* query_string, QueryParams& query_params) {
  91. const char* p = strchr(query_string, '?');
  92. p = p ? p+1 : query_string;
  93. p = unescape(p).c_str();
  94. enum {
  95. s_key,
  96. s_value,
  97. } state = s_key;
  98. const char* key = p;
  99. const char* value = NULL;
  100. int key_len = 0;
  101. int value_len = 0;
  102. while (*p != '\0') {
  103. if (*p == '&') {
  104. if (key_len && value_len) {
  105. query_params[std::string(key,key_len)] = std::string(value,value_len);
  106. key_len = value_len = 0;
  107. }
  108. state = s_key;
  109. key = p+1;
  110. }
  111. else if (*p == '=') {
  112. state = s_value;
  113. value = p+1;
  114. }
  115. else {
  116. state == s_key ? ++key_len : ++value_len;
  117. }
  118. ++p;
  119. }
  120. if (key_len && value_len) {
  121. query_params[std::string(key,key_len)] = std::string(value,value_len);
  122. key_len = value_len = 0;
  123. }
  124. return query_params.size() == 0 ? -1 : 0;
  125. }
  126. std::string dump_json(Json& json) {
  127. return json.dump();
  128. }
  129. std::string g_parse_json_errmsg;
  130. int parse_json(const char* str, Json& json, std::string& errmsg) {
  131. try {
  132. json = Json::parse(str);
  133. }
  134. catch(nlohmann::detail::exception e) {
  135. errmsg = e.what();
  136. return -1;
  137. }
  138. return (json.is_discarded() || json.is_null()) ? -1 : 0;
  139. }
  140. std::string dump_multipart(MultiPart& mp, const char* boundary) {
  141. char c_str[256] = {0};
  142. std::string str;
  143. for (auto& pair : mp) {
  144. str += "--";
  145. str += boundary;
  146. str += "\r\n";
  147. str += "Content-Disposition: form-data";
  148. snprintf(c_str, sizeof(c_str), "; name=\"%s\"", pair.first.c_str());
  149. str += c_str;
  150. auto& form = pair.second;
  151. if (form.filename.size() != 0) {
  152. if (form.content.size() == 0) {
  153. HFile file;
  154. if (file.open(form.filename.c_str(), "r") == 0) {
  155. file.readall(form.content);
  156. }
  157. }
  158. snprintf(c_str, sizeof(c_str), "; filename=\"%s\"", basename(form.filename).c_str());
  159. str += c_str;
  160. }
  161. str += "\r\n\r\n";
  162. str += form.content;
  163. str += "\r\n";
  164. }
  165. str += "--";
  166. str += boundary;
  167. str += "--";
  168. return str;
  169. }
  170. #include "multipart_parser.h"
  /**
   * Progress marker stored in multipart_parser_userdata::state.
   *
   * parse_multipart() starts at MP_START; each parser callback in this file
   * then records the value that matches its own name. The numeric values are
   * spelled out explicitly and equal the implicit 0..7 numbering.
   */
  enum multipart_parser_state_e {
      MP_START            = 0,  // set by parse_multipart() before parsing
      MP_PART_DATA_BEGIN  = 1,  // set by on_part_data_begin()
      MP_HEADER_FIELD     = 2,  // set by on_header_field()
      MP_HEADER_VALUE     = 3,  // set by on_header_value()
      MP_HEADERS_COMPLETE = 4,  // set by on_headers_complete()
      MP_PART_DATA        = 5,  // set by on_part_data()
      MP_PART_DATA_END    = 6,  // set by on_part_data_end()
      MP_BODY_END         = 7   // set by on_body_end()
  };
  181. struct multipart_parser_userdata {
  182. MultiPart* mp;
  183. // tmp
  184. multipart_parser_state_e state;
  185. std::string header_field;
  186. std::string header_value;
  187. std::string part_data;
  188. std::string name;
  189. std::string filename;
  190. void handle_header() {
  191. if (header_field.size() == 0 || header_value.size() == 0) return;
  192. if (stricmp(header_field.c_str(), "Content-Disposition") == 0) {
  193. StringList strlist = split(header_value, ';');
  194. for (auto& str : strlist) {
  195. StringList kv = split(trim(str, " "), '=');
  196. if (kv.size() == 2) {
  197. const char* key = kv.begin()->c_str();
  198. const char* value = trim_pairs(*(kv.begin()+1), "\"\"").c_str();
  199. if (strcmp(key, "name") == 0) {
  200. name = value;
  201. }
  202. else if (strcmp(key, "filename") == 0) {
  203. filename = value;
  204. }
  205. }
  206. }
  207. }
  208. header_field.clear();
  209. header_value.clear();
  210. }
  211. void handle_data() {
  212. if (name.c_str() != 0) {
  213. (*mp)[name] = FormData(part_data.c_str(), filename.c_str());
  214. }
  215. name.clear();
  216. filename.clear();
  217. part_data.clear();
  218. }
  219. };
  220. static int on_header_field(multipart_parser* parser, const char *at, size_t length) {
  221. printf("on_header_field:%.*s\n", (int)length, at);
  222. multipart_parser_userdata* userdata = (multipart_parser_userdata*)multipart_parser_get_data(parser);
  223. userdata->handle_header();
  224. userdata->state = MP_HEADER_FIELD;
  225. userdata->header_field.insert(userdata->header_field.size(), at, length);
  226. return 0;
  227. }
  228. static int on_header_value(multipart_parser* parser, const char *at, size_t length) {
  229. printf("on_header_value:%.*s\n", (int)length, at);
  230. multipart_parser_userdata* userdata = (multipart_parser_userdata*)multipart_parser_get_data(parser);
  231. userdata->state = MP_HEADER_VALUE;
  232. userdata->header_value.insert(userdata->header_value.size(), at, length);
  233. return 0;
  234. }
  235. static int on_part_data(multipart_parser* parser, const char *at, size_t length) {
  236. printf("on_part_data:%.*s\n", (int)length, at);
  237. multipart_parser_userdata* userdata = (multipart_parser_userdata*)multipart_parser_get_data(parser);
  238. userdata->state = MP_PART_DATA;
  239. userdata->part_data.insert(userdata->part_data.size(), at, length);
  240. return 0;
  241. }
  242. static int on_part_data_begin(multipart_parser* parser) {
  243. printf("on_part_data_begin\n");
  244. multipart_parser_userdata* userdata = (multipart_parser_userdata*)multipart_parser_get_data(parser);
  245. userdata->state = MP_PART_DATA_BEGIN;
  246. return 0;
  247. }
  248. static int on_headers_complete(multipart_parser* parser) {
  249. printf("on_headers_complete\n");
  250. multipart_parser_userdata* userdata = (multipart_parser_userdata*)multipart_parser_get_data(parser);
  251. userdata->handle_header();
  252. userdata->state = MP_HEADERS_COMPLETE;
  253. return 0;
  254. }
  255. static int on_part_data_end(multipart_parser* parser) {
  256. printf("on_part_data_end\n");
  257. multipart_parser_userdata* userdata = (multipart_parser_userdata*)multipart_parser_get_data(parser);
  258. userdata->state = MP_PART_DATA_END;
  259. userdata->handle_data();
  260. return 0;
  261. }
  262. static int on_body_end(multipart_parser* parser) {
  263. printf("on_body_end\n");
  264. multipart_parser_userdata* userdata = (multipart_parser_userdata*)multipart_parser_get_data(parser);
  265. userdata->state = MP_BODY_END;
  266. return 0;
  267. }
  268. int parse_multipart(std::string& str, MultiPart& mp, const char* boundary) {
  269. printf("boundary=%s\n", boundary);
  270. std::string __boundary("--");
  271. __boundary += boundary;
  272. multipart_parser_settings settings;
  273. settings.on_header_field = on_header_field;
  274. settings.on_header_value = on_header_value;
  275. settings.on_part_data = on_part_data;
  276. settings.on_part_data_begin = on_part_data_begin;
  277. settings.on_headers_complete = on_headers_complete;
  278. settings.on_part_data_end = on_part_data_end;
  279. settings.on_body_end = on_body_end;
  280. multipart_parser* parser = multipart_parser_init(__boundary.c_str(), &settings);
  281. multipart_parser_userdata userdata;
  282. userdata.state = MP_START;
  283. userdata.mp = &mp;
  284. multipart_parser_set_data(parser, &userdata);
  285. size_t nparse = multipart_parser_execute(parser, str.c_str(), str.size());
  286. multipart_parser_free(parser);
  287. return nparse == str.size() ? 0 : -1;
  288. }