aboutsummaryrefslogtreecommitdiff
path: root/src/xml.c
blob: 66899970ecdf746e5775c2d0ff2ef4bfb4478721 (plain)
  1. #include <stdlib.h>
  2. #include <stdio.h>
  3. #include <string.h>
  4. #include <assert.h>
  5. #include "config.h"
  6. #include "cmark.h"
  7. #include "node.h"
  8. #include "buffer.h"
  9. #include "houdini.h"
  10. // Functions to convert cmark_nodes to XML strings.
  11. static void escape_xml(cmark_strbuf *dest, const unsigned char *source, int length)
  12. {
  13. if (source != NULL) {
  14. if (length < 0)
  15. length = strlen((char *)source);
  16. houdini_escape_html0(dest, source, (size_t)length, 0);
  17. }
  18. }
  19. struct render_state {
  20. cmark_strbuf* xml;
  21. int indent;
  22. };
  23. static inline void indent(struct render_state *state)
  24. {
  25. int i;
  26. for (i = 0; i < state->indent; i++) {
  27. cmark_strbuf_putc(state->xml, ' ');
  28. }
  29. }
  30. static int
  31. S_render_node(cmark_node *node, cmark_event_type ev_type,
  32. struct render_state *state, long options)
  33. {
  34. cmark_strbuf *xml = state->xml;
  35. bool literal = false;
  36. cmark_delim_type delim;
  37. bool entering = (ev_type == CMARK_EVENT_ENTER);
  38. if (entering) {
  39. indent(state);
  40. cmark_strbuf_printf(xml, "<%s",
  41. cmark_node_get_type_string(node));
  42. if (options & CMARK_OPT_SOURCEPOS && node->start_line != 0) {
  43. cmark_strbuf_printf(xml, " sourcepos=\"%d:%d-%d:%d\"",
  44. node->start_line,
  45. node->start_column,
  46. node->end_line,
  47. node->end_column);
  48. }
  49. literal = false;
  50. switch (node->type) {
  51. case CMARK_NODE_TEXT:
  52. case CMARK_NODE_CODE:
  53. case CMARK_NODE_HTML:
  54. case CMARK_NODE_INLINE_HTML:
  55. cmark_strbuf_puts(xml, ">");
  56. escape_xml(xml, node->as.literal.data,
  57. node->as.literal.len);
  58. cmark_strbuf_puts(xml, "</");
  59. cmark_strbuf_puts(xml,
  60. cmark_node_get_type_string(node));
  61. literal = true;
  62. break;
  63. case CMARK_NODE_LIST:
  64. switch (cmark_node_get_list_type(node)) {
  65. case CMARK_ORDERED_LIST:
  66. cmark_strbuf_puts(xml, " type=\"ordered\"");
  67. cmark_strbuf_printf(xml, " start=\"%d\"",
  68. cmark_node_get_list_start(node));
  69. delim = cmark_node_get_list_delim(node);
  70. if (delim == CMARK_PAREN_DELIM) {
  71. cmark_strbuf_puts(xml,
  72. " delim=\"paren\"");
  73. } else if (delim == CMARK_PERIOD_DELIM) {
  74. cmark_strbuf_puts(xml,
  75. " delim=\"period\"");
  76. }
  77. break;
  78. case CMARK_BULLET_LIST:
  79. cmark_strbuf_puts(xml, " type=\"bullet\"");
  80. break;
  81. default:
  82. break;
  83. }
  84. cmark_strbuf_printf(xml, " tight=\"%s\"",
  85. (cmark_node_get_list_tight(node) ?
  86. "true" : "false"));
  87. break;
  88. case CMARK_NODE_CODE_BLOCK:
  89. if (node->as.code.info.len > 0) {
  90. cmark_strbuf_puts(xml, " info=\"");
  91. escape_xml(xml, node->as.code.info.data,
  92. node->as.code.info.len);
  93. cmark_strbuf_putc(xml, '"');
  94. }
  95. cmark_strbuf_puts(xml, ">");
  96. escape_xml(xml, node->as.code.literal.data,
  97. node->as.code.literal.len);
  98. cmark_strbuf_puts(xml, "</");
  99. cmark_strbuf_puts(xml,
  100. cmark_node_get_type_string(node));
  101. literal = true;
  102. break;
  103. case CMARK_NODE_LINK:
  104. case CMARK_NODE_IMAGE:
  105. cmark_strbuf_puts(xml, " url=\"");
  106. escape_xml(xml, node->as.link.url, -1);
  107. cmark_strbuf_putc(xml, '"');
  108. cmark_strbuf_puts(xml, " title=\"");
  109. escape_xml(xml, node->as.link.title, -1);
  110. cmark_strbuf_putc(xml, '"');
  111. break;
  112. default:
  113. break;
  114. }
  115. if (node->first_child) {
  116. state->indent += 2;
  117. } else if (!literal) {
  118. cmark_strbuf_puts(xml, " /");
  119. }
  120. cmark_strbuf_puts(xml, ">\n");
  121. } else if (node->first_child) {
  122. state->indent -= 2;
  123. indent(state);
  124. cmark_strbuf_printf(xml, "</%s>\n",
  125. cmark_node_get_type_string(node));
  126. }
  127. return 1;
  128. }
  129. char *cmark_render_xml(cmark_node *root, long options)
  130. {
  131. char *result;
  132. cmark_strbuf xml = GH_BUF_INIT;
  133. cmark_event_type ev_type;
  134. cmark_node *cur;
  135. struct render_state state = { &xml, 0 };
  136. if (options & CMARK_OPT_NORMALIZE) {
  137. cmark_consolidate_text_nodes(root);
  138. }
  139. cmark_iter *iter = cmark_iter_new(root);
  140. cmark_strbuf_puts(state.xml,
  141. "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n");
  142. cmark_strbuf_puts(state.xml,
  143. "<!DOCTYPE CommonMark SYSTEM \"CommonMark.dtd\">\n");
  144. while ((ev_type = cmark_iter_next(iter)) != CMARK_EVENT_DONE) {
  145. cur = cmark_iter_get_node(iter);
  146. S_render_node(cur, ev_type, &state, options);
  147. }
  148. result = (char *)cmark_strbuf_detach(&xml);
  149. cmark_iter_free(iter);
  150. cmark_strbuf_free(&xml);
  151. return result;
  152. }