microjson.cpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386
  1. /*
  2. * MIT License
  3. *
  4. * Copyright (c) 2020 Alexey Edelev <semlanik@gmail.com>
  5. *
  6. * This file is part of microjson project https://git.semlanik.org/semlanik/microjson
  7. *
  8. * Permission is hereby granted, free of charge, to any person obtaining a copy of this
  9. * software and associated documentation files (the "Software"), to deal in the Software
  10. * without restriction, including without limitation the rights to use, copy, modify,
  11. * merge, publish, distribute, sublicense, and/or sell copies of the Software, and
  12. * to permit persons to whom the Software is furnished to do so, subject to the following
  13. * conditions:
  14. *
  15. * The above copyright notice and this permission notice shall be included in all copies
  16. * or substantial portions of the Software.
  17. *
  18. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
  19. * INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
  20. * PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE
  21. * FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  22. * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  23. * DEALINGS IN THE SOFTWARE.
  24. */
  25. #include "microjson.h"
  26. #include <iostream>
  27. #ifdef MICROJSON_DEBUG
  28. #define microjsonDebug std::cout
  29. #else
  30. struct microjsonNull : public std::ostream {};
  31. static microjsonNull nullout;
  32. #define microjsonDebug nullout
  33. #endif
  34. namespace {
  35. template<const char expectedBeginByte>
  36. void lookForBoundaries(const char *buffer, size_t size, size_t &begin, size_t &end) {
  37. const char expectedEndByte = expectedBeginByte + 2;
  38. begin = SIZE_MAX;
  39. end = SIZE_MAX;
  40. for (size_t i = 0; i < size; i++) {
  41. const char beginByte = buffer[i];
  42. const char endByte = buffer[size - i - 1];
  43. if (begin == SIZE_MAX) {
  44. if (beginByte == expectedBeginByte) {
  45. begin = i;
  46. } else if (beginByte != '\n' && beginByte != ' ' && beginByte != '\r' && beginByte != '\t') {
  47. std::cerr << "Unexpected begin byte" << beginByte << std::endl;
  48. break;
  49. }
  50. }
  51. if (end == SIZE_MAX) {
  52. if (endByte == expectedEndByte) {
  53. end = size - i - 1;
  54. } else if (endByte != '\n' && endByte != ' ' && endByte != '\r' && endByte != '\t') {
  55. std::cerr << "Unexpected end byte" << endByte << std::endl;
  56. break;
  57. }
  58. }
  59. if (begin != SIZE_MAX && end != SIZE_MAX) {
  60. break;
  61. }
  62. }
  63. }
  64. void lookForName(const char *buffer, size_t size, size_t &i, microjson::JsonProperty &property) {
  65. property.nameBegin = SIZE_MAX;
  66. property.nameEnd = SIZE_MAX;
  67. bool beginFound = false;
  68. for(; i < size; ++i) {
  69. const char byte = buffer[i];
  70. if (microjson::skipWhiteSpace(byte)) {
  71. microjsonDebug << "Skip space" << std::endl;
  72. continue;
  73. }
  74. if(!beginFound) {
  75. if (byte == '"') {
  76. microjsonDebug << "Found name begin" << std::endl;
  77. property.nameBegin = i + 1;
  78. beginFound = true;
  79. } else {
  80. std::cerr << "Not found name begin, unexpected" << std::endl;
  81. break;
  82. }
  83. } else if(byte == '"') {
  84. if (i > 0 && buffer[i - 1] == '\\') {
  85. microjsonDebug << "'\"' found in name" << std::endl;
  86. continue;
  87. }
  88. microjsonDebug << "Found name end" << std::endl;
  89. property.nameEnd = i;
  90. break;
  91. }
  92. }
  93. ++i;
  94. }
  95. bool lookForSeparator(const char* buffer, size_t size, size_t &i) {
  96. bool found = false;
  97. for(; i < size; ++i) {
  98. const char byte = buffer[i];
  99. if (microjson::skipWhiteSpace(byte)) {
  100. microjsonDebug << "Skip space" << std::endl;
  101. continue;
  102. }
  103. if (byte == ':') {
  104. microjsonDebug << "Found Separator" << std::endl;
  105. found = true;
  106. }
  107. break;
  108. }
  109. ++i;
  110. return found;
  111. }
  112. void lookForValue(const char *buffer, size_t size, size_t &i, microjson::JsonProperty &property) {
  113. int valueBracesCounter = -1;
  114. int valueBracketsCounter = -1;
  115. int trueCounter = 3;
  116. int falseCounter = 4;
  117. std::function<bool(void)> valueEndMarker;
  118. bool beginFound = false;
  119. bool stringScope = false;
  120. property.valueBegin = SIZE_MAX;
  121. property.valueEnd = SIZE_MAX;
  122. for(; i < size; i++) {
  123. const char byte = buffer[i];
  124. if (!beginFound) {
  125. microjsonDebug << "lookForValue at: " << i << " byte: " << byte << std::endl;
  126. if (microjson::skipWhiteSpace(byte)) {
  127. microjsonDebug << "Skip space" << std::endl;
  128. continue;
  129. }
  130. switch (byte) {
  131. case '"':
  132. valueEndMarker = [&](){
  133. return buffer[i] == '"' && buffer[i - 1] != '\\';
  134. };
  135. property.type = microjson::JsonStringType;
  136. break;
  137. case '-':
  138. case '0':
  139. case '1':
  140. case '2':
  141. case '3':
  142. case '4':
  143. case '5':
  144. case '6':
  145. case '7':
  146. case '8':
  147. case '9':
  148. valueEndMarker = [&buffer, &i](){
  149. if (buffer[i] != '+'
  150. && buffer[i] != '-'
  151. && buffer[i] != '0'
  152. && buffer[i] != '1'
  153. && buffer[i] != '2'
  154. && buffer[i] != '3'
  155. && buffer[i] != '4'
  156. && buffer[i] != '5'
  157. && buffer[i] != '6'
  158. && buffer[i] != '7'
  159. && buffer[i] != '8'
  160. && buffer[i] != '9'
  161. && buffer[i] != 'e'
  162. && buffer[i] != '.') {
  163. i--;
  164. return true;
  165. }
  166. return false;
  167. };
  168. property.type = microjson::JsonNumberType;
  169. break;
  170. case '{':
  171. valueBracesCounter++;
  172. valueEndMarker = [&stringScope, &byte, &valueBracesCounter](){
  173. if (!stringScope) {
  174. switch (byte) {
  175. case '}':
  176. --valueBracesCounter;
  177. break;
  178. case '{':
  179. ++valueBracesCounter;
  180. break;
  181. default:
  182. break;
  183. }
  184. }
  185. return valueBracesCounter < 0;
  186. };
  187. property.type = microjson::JsonObjectType;
  188. break;
  189. case 't':
  190. valueEndMarker = [&trueCounter](){
  191. --trueCounter;
  192. return trueCounter == 0;
  193. };
  194. property.type = microjson::JsonBoolType;
  195. break;
  196. case 'f':
  197. valueEndMarker = [&falseCounter](){
  198. --falseCounter;
  199. return falseCounter == 0;
  200. };
  201. property.type = microjson::JsonBoolType;
  202. break;
  203. case '[':
  204. valueBracketsCounter++;
  205. valueEndMarker = [&stringScope, &byte, &valueBracketsCounter](){
  206. if(!stringScope) {
  207. switch(byte) {
  208. case ']':
  209. --valueBracketsCounter;
  210. break;
  211. case '[':
  212. ++valueBracketsCounter;
  213. break;
  214. default:
  215. break;
  216. }
  217. }
  218. return valueBracketsCounter < 0;
  219. };
  220. property.type = microjson::JsonArrayType;
  221. break;
  222. }
  223. if (valueEndMarker) {
  224. microjsonDebug << "Found value begin" << std::endl;
  225. property.valueBegin = i;
  226. beginFound = true;
  227. } else {
  228. break;
  229. }
  230. } else {
  231. if (byte == '"' && (i == 0 || buffer[i - 1] != '\\')) {
  232. stringScope = !stringScope;
  233. }
  234. if (valueEndMarker()) {
  235. microjsonDebug << "Found value end" << std::endl;
  236. property.valueEnd = i;
  237. break;
  238. }
  239. }
  240. }
  241. if (property.checkEof()) {
  242. property.valueEnd = size - 1; //EOF case
  243. microjsonDebug << "Found value end at EOF" << std::endl;
  244. }
  245. if (property.type == microjson::JsonStringType) {
  246. ++property.valueBegin;
  247. --property.valueEnd;
  248. }
  249. }
  250. void findSeparator(const char *buffer, size_t size, size_t &i, const char expectedEndByte) {
  251. while (++i < size) {
  252. if(!microjson::skipWhiteSpace(buffer[i])) {
  253. break;
  254. }
  255. }
  256. const char endByte = buffer[i];
  257. if (endByte == expectedEndByte) {
  258. if(++i != size) {
  259. i = SIZE_MAX;
  260. }
  261. } else if(endByte == ',') {
  262. ++i;
  263. } else {
  264. i = SIZE_MAX;
  265. }
  266. }
  267. bool extractValue(const char *buffer, size_t size, size_t &i, const char expectedEndByte, microjson::JsonProperty &property) {
  268. if (size == 0) {
  269. i = SIZE_MAX;
  270. return false;
  271. }
  272. lookForValue(buffer, size, i, property);
  273. findSeparator(buffer, size, i, expectedEndByte);
  274. return property.checkValue();
  275. }
  276. using Extractor = bool(*)(const char *, size_t, size_t &, const char, microjson::JsonProperty &);
  277. template<typename R,
  278. const char expectedBeginByte,
  279. Extractor extract,
  280. void(* collect)(const char *, R &, const microjson::JsonProperty &property)>
  281. R parseJsonCommon(const char *buffer, size_t size) {
  282. R returnValue;
  283. if (buffer == nullptr || size == 0 || size == SIZE_MAX) {
  284. return returnValue;
  285. }
  286. size_t objectBeginPosition = SIZE_MAX;
  287. size_t objectEndPosition = SIZE_MAX;
  288. lookForBoundaries<expectedBeginByte>(buffer, size, objectBeginPosition, objectEndPosition);
  289. if (objectBeginPosition == SIZE_MAX || objectEndPosition == SIZE_MAX) {
  290. return returnValue;
  291. }
  292. microjson::JsonProperty property;
  293. buffer += objectBeginPosition + 1;//Skip '{'
  294. size = objectEndPosition - objectBeginPosition;//Do not skip '}'
  295. microjsonDebug << "Object buffer size: " << size << " buffer: " << std::string(buffer, size) << std::endl;
  296. size_t nextPosition = 0;
  297. while (nextPosition < size) {
  298. microjsonDebug << "nextPropertyPosition: " << nextPosition << "size: " << size << std::endl;
  299. if(extract(buffer, size, nextPosition, expectedBeginByte + 2, property)) {
  300. collect(buffer, returnValue, property);
  301. }
  302. }
  303. return returnValue;
  304. }
  305. void appendProperty(const char* buffer, microjson::JsonObject &obj, const microjson::JsonProperty &property){
  306. std::string name((buffer + property.nameBegin), property.nameSize());
  307. std::string value;
  308. if(property.valueSize() > 0) {
  309. value = std::string((buffer + property.valueBegin), property.valueSize());
  310. }
  311. microjsonDebug << "name: " << name << " value: " << value << std::endl;
  312. obj[name] = { value, property.type };
  313. };
  314. void appendValue(const char* buffer, microjson::JsonArray &values, const microjson::JsonProperty &property){
  315. std::string value = std::string((buffer + property.valueBegin), property.valueSize());
  316. microjsonDebug << "value: " << value << std::endl;
  317. values.push_back({value, property.type});
  318. };
  319. }
  320. bool microjson::extractProperty(const char *buffer, size_t size, size_t &i, const char expectedEndByte, microjson::JsonProperty &property) {
  321. if (size == 0) {
  322. i = SIZE_MAX;
  323. return false;
  324. }
  325. lookForName(buffer, size, i, property);
  326. if(property.nameBegin == SIZE_MAX && property.nameEnd == SIZE_MAX) {
  327. std::cerr << "Name not found" << std::endl;
  328. return false;
  329. }
  330. microjsonDebug << "Found name: " << std::string(buffer + property.nameBegin, property.nameSize()) << std::endl;
  331. if(!lookForSeparator(buffer, size, i)) {
  332. std::cerr << "Separator not found" << std::endl;
  333. return false;
  334. }
  335. lookForValue(buffer, size, i, property);
  336. microjsonDebug << "Found value: " << std::string(buffer + property.valueBegin, property.valueSize()) << std::endl;
  337. findSeparator(buffer, size, i, expectedEndByte);
  338. return property.check();
  339. }
  340. microjson::JsonObject microjson::parseJsonObject(const char *buffer, size_t size) {
  341. return parseJsonCommon<JsonObject, '{', extractProperty, appendProperty>(buffer, size);
  342. }
  343. microjson::JsonArray microjson::parseJsonArray(const char *buffer, size_t size) {
  344. return parseJsonCommon<JsonArray, '[', extractValue, appendValue>(buffer, size);
  345. }