summaryrefslogtreecommitdiff
path: root/cmarkdown.c
diff options
context:
space:
mode:
authorgottox@rootkit.lan <gottox@rootkit.lan>2008-01-01 14:52:08 +0100
committergottox@rootkit.lan <gottox@rootkit.lan>2008-01-01 14:52:08 +0100
commit4f419311ff164306ae138bb363dbffa5797fbd12 (patch)
tree393794f3490c8440c6f874ca7eb716bafe4f9f0c /cmarkdown.c
parentd5058298da1fef8596066d1822a67d6a0eaff614 (diff)
renamed project to smu - simple markup
--HG-- rename : cmarkdown.1 => smu.1 rename : cmarkdown.c => smu.c
Diffstat (limited to 'cmarkdown.c')
-rw-r--r--cmarkdown.c537
1 files changed, 0 insertions, 537 deletions
diff --git a/cmarkdown.c b/cmarkdown.c
deleted file mode 100644
index f624593..0000000
--- a/cmarkdown.c
+++ /dev/null
@@ -1,537 +0,0 @@
-/* cmarkdown
- * Copyright (C) <2007> Enno boland <g s01 de>
- *
- * See LICENSE for further informations
- */
-
-#include <stdlib.h>
-#include <stdio.h>
-#include <stdarg.h>
-#include <string.h>
-
-#define BUFFERSIZE 512
-#define LENGTH(x) sizeof(x)/sizeof(x[0])
-#define ADDC(b,i) if(i % BUFFERSIZE == 0) \
- { b = realloc(b,(i + BUFFERSIZE) * sizeof(b)); if(!b) eprint("Malloc failed."); }; b[i]
-
-
-typedef unsigned int (*Parser)(const char *, const char *, int);
-struct Tag {
- char *search;
- int process;
- char *before, *after;
-};
-
-
-void eprint(const char *format, ...); /* Prints error and exits */
-unsigned int doamp(const char *begin, const char *end, int newblock);
- /* Parser for & */
-unsigned int dohtml(const char *begin, const char *end, int newblock);
- /* Parser for html */
-unsigned int dolineprefix(const char *begin, const char *end, int newblock);
- /* Parser for line prefix tags */
-unsigned int dolink(const char *begin, const char *end, int newblock);
- /* Parser for links and images */
-unsigned int dolist(const char *begin, const char *end, int newblock);
- /* Parser for lists */
-unsigned int doparagraph(const char *begin, const char *end, int newblock);
- /* Parser for paragraphs */
-unsigned int doreplace(const char *begin, const char *end, int newblock);
- /* Parser for simple replaces */
-unsigned int doshortlink(const char *begin, const char *end, int newblock);
- /* Parser for links and images */
-unsigned int dosurround(const char *begin, const char *end, int newblock);
- /* Parser for surrounding tags */
-unsigned int dounderline(const char *begin, const char *end, int newblock);
- /* Parser for underline tags */
-void hprint(const char *begin, const char *end); /* escapes HTML and prints it to stdout*/
-void process(const char *begin, const char *end, int isblock);
- /* Processes range between begin and end. */
-
-Parser parsers[] = { dounderline, dohtml, dolineprefix, dolist, doparagraph,
- dosurround, dolink, doshortlink, doamp, doreplace }; /* list of parsers */
-FILE *source;
-unsigned int bsize = 0, nohtml = 0;
-struct Tag lineprefix[] = {
- { " ", 0, "<pre><code>", "</code></pre>" },
- { "\t", 0, "<pre><code>", "</code></pre>" },
- { "> ", 2, "<blockquote>", "</blockquote>" },
- { "###### ", 1, "<h6>", "</h6>" },
- { "##### ", 1, "<h5>", "</h5>" },
- { "#### ", 1, "<h4>", "</h4>" },
- { "### ", 1, "<h3>", "</h3>" },
- { "## ", 1, "<h2>", "</h2>" },
- { "# ", 1, "<h1>", "</h1>" },
-};
-struct Tag underline[] = {
- { "=", 1, "<h1>", "</h1>\n" },
- { "-", 1, "<h2>", "</h2>\n" },
-};
-struct Tag surround[] = {
- { "``", 0, "<code>", "</code>" },
- { "`", 0, "<code>", "</code>" },
- { "__", 1, "<strong>", "</strong>" },
- { "**", 1, "<strong>", "</strong>" },
- { "*", 1, "<em>", "</em>" },
- { "_", 1, "<em>", "</em>" },
-};
-char * replace[][2] = {
- { "\n- - -\n", "\n<hr />\n" },
- { "\n- - - \n", "\n<hr />\n" },
- { " ######\n", "\n" },
- { " #####\n", "\n" },
- { " ####\n", "\n" },
- { " ###\n", "\n" },
- { " ##\n", "\n" },
- { " #\n", "\n" },
- { " >", "&gt;" },
- { "< ", "&lt;" },
- { "\\\\", "\\" },
- { "\\`", "`" },
- { "\\*", "*" },
- { "\\_", "_" },
- { "\\{", "{" },
- { "\\}", "}" },
- { "\\[", "[" },
- { "\\]", "]" },
- { "\\(", "(" },
- { "\\)", ")" },
- { "\\#", "#" },
- { "\\+", "+" },
- { "\\-", "-" },
- { "\\.", "." },
- { "\\!", "!" },
-};
-char * insert[][2] = {
- { " \n", "<br />" },
-};
-
-void
-eprint(const char *format, ...) {
- va_list ap;
-
- va_start(ap, format);
- vfprintf(stderr, format, ap);
- va_end(ap);
- exit(EXIT_FAILURE);
-}
-
-unsigned int
-doamp(const char *begin, const char *end, int newblock) {
- const char *p;
-
- if(*begin != '&')
- return 0;
- if(!nohtml) {
- for(p = begin + 1; !strchr("; \\\n\t",*p); p++);
- if(*p == ';')
- return 0;
- }
- fputs("&amp;",stdout);
- return 1;
-}
-
-unsigned int
-dohtml(const char *begin, const char *end, int newblock) {
- const char *p, *tag, *tagend;
-
- if(nohtml || !newblock || *begin == '\n')
- return 0;
- p = begin;
- if(p[1] == '\n')
- p++;
- if(p[1] != '<' || strchr(" /\n\t\\",p[2]))
- return 0;
- tag = p + 2;
- p += 2;
- for(; !strchr(" >",*p);p++);
- tagend = p;
- while((p = strstr(p,"\n</")) && p < end) {
- p+=3;
- if(strncmp(p, tag, tagend-tag) == 0 && p[tagend-tag] == '>') {
- p++;
- fwrite(begin, sizeof(char), p - begin + tagend - tag,stdout);
- puts("\n");
- return -(p - begin + tagend - tag);
- }
- }
- return 0;
-}
-
-unsigned int
-dolineprefix(const char *begin, const char *end, int newblock) {
- unsigned int i, j, l;
- char *buffer;
- const char *p;
-
- if(!newblock)
- return 0;
- p = begin;
- for(i = 0; i < LENGTH(lineprefix); i++) {
- l = strlen(lineprefix[i].search);
- if(end - p < l)
- continue;
- if(strncmp(lineprefix[i].search,p,l))
- continue;
- if(!(buffer = malloc(BUFFERSIZE)))
- eprint("Malloc failed.");
- buffer[0] = '\0';
- fputs(lineprefix[i].before,stdout);
- for(j = 0, p += l; p != end; p++, j++) {
- ADDC(buffer,j) = *p;
- if(*p == '\n') {
- if(strncmp(lineprefix[i].search,p+1,l) != 0)
- break;
- p += l;
- }
- }
- ADDC(buffer,j) = '\0';
- if(lineprefix[i].process)
- process(buffer,buffer+strlen(buffer), lineprefix[i].process >= 2);
- else
- hprint(buffer,buffer+strlen(buffer));
- puts(lineprefix[i].after);
- free(buffer);
- return -(p - begin);
- }
- return 0;
-}
-
-unsigned int
-dolink(const char *begin, const char *end, int newblock) {
- int img;
- const char *desc, *link, *p, *q, *descend, *linkend;
-
- if(*begin == '[')
- img = 0;
- else if(strncmp(begin,"![",2) == 0)
- img = 1;
- else
- return 0;
- p = desc = begin + 1 + img;
- if(!(p = strstr(desc, "](")) || p > end)
- return 0;
- for(q = strstr(desc, "!["); q && q < end && q < p; q = strstr(q+1,"!["))
- if(!(p = strstr(p+1, "](")) || p > end)
- return 0;
- descend = p;
- link = p + 2;
- if(!(p = strstr(link, ")")) || p > end)
- return 0;
- linkend = p;
- if(img) {
- fputs("<img src=\"",stdout);
- hprint(link,linkend);
- fputs("\" alt=\"",stdout);
- hprint(desc,descend);
- fputs("\" />",stdout);
- }
- else {
- fputs("<a href=\"",stdout);
- hprint(link,linkend);
- fputs("\">",stdout);
- process(desc,descend,0);
- fputs("</a>",stdout);
- }
- return p + 1 - begin;
-}
-
-unsigned int
-dolist(const char *begin, const char *end, int newblock) {
- unsigned int i, j, indent, run, ul, isblock;
- const char *p, *q;
- char *buffer;
-
- isblock = 0;
- if(newblock)
- p = begin;
- else if(*begin == '\n')
- p = begin + 1;
- else
- return 0;
- q = p;
- if(*p == '-' || *p == '*' || *p == '+')
- ul = 1;
- else {
- ul = 0;
- for(; *p && p != end && *p >= '0' && *p <= '9';p++);
- if(!*p || p[0] != '.')
- return 0;
- }
- if(p[1] != ' ' && p[1] != '\t')
- return 0;
- for(p++; *p && p != end && (*p == ' ' || *p == '\t'); p++);
- indent = p - q;
- if(!(buffer = malloc(BUFFERSIZE)))
- eprint("Malloc failed.");
- if(!newblock)
- putchar('\n');
- fputs(ul ? "<ul>\n" : "<ol>\n",stdout);
- run = 1;
- for(i = 0; *p && p < end && run; p++) {
- buffer[0] = '\0';
- for(i = 0; *p && p < end && run; p++,i++) {
- if(*p == '\n') {
- if(p[1] == '\n') {
- p++;
- ADDC(buffer,i) = '\n';
- i++;
- run = 0;
- isblock++;
- }
- q = p + 1;
- j = 0;
- if(ul && (*q == '-' || *q == '*' || *q == '+'))
- j = 1;
- else if(!ul) {
- for(; q[j] >= '0' && q[j] <= '9' && j < indent; j++);
- if(j > 0 && q[j] == '.')
- j++;
- else
- j = 0;
- }
- for(;(q[j] == ' ' || *q == '\t') && j < indent; j++);
- if(j == indent) {
- ADDC(buffer,i) = '\n';
- i++;
- p += indent;
- run = 1;
- if(*q == ' ' || *q == '\t')
- p++;
- else
- break;
- }
- }
- ADDC(buffer,i) = *p;
- }
- ADDC(buffer,i) = '\0';
- fputs("<li>",stdout);
- process(buffer,buffer+i,isblock > 1 || (isblock == 1 && run));
- fputs("</li>\n",stdout);
- }
- fputs(ul ? "</ul>\n" : "</ol>\n",stdout);
- free(buffer);
- p--;
- while(*(--p) == '\n');
- return -(p - begin + 1);
-}
-
-unsigned int
-doparagraph(const char *begin, const char *end, int newblock) {
- const char *p, *q;
-
- if(!newblock)
- return 0;
- p = begin;
- q = strstr(p, "\n\n");
- if(!q || q > end)
- q = end;
- if(q - begin <= 1)
- return 0;
- fputs("<p>\n",stdout);
- process(p,q,0);
- fputs("\n</p>\n",stdout);
- return -(q - begin);
-}
-
-unsigned int
-doreplace(const char *begin, const char *end, int newblock) {
- unsigned int i, l;
-
- for(i = 0; i < LENGTH(insert); i++)
- if(strncmp(insert[i][0],begin,strlen(insert[i][0])) == 0)
- fputs(insert[i][1], stdout);
- for(i = 0; i < LENGTH(replace); i++) {
- l = strlen(replace[i][0]);
- if(end - begin < l)
- continue;
- if(strncmp(replace[i][0],begin,l) == 0) {
- fputs(replace[i][1], stdout);
- return l;
- }
- }
- return 0;
-}
-
-unsigned int
-doshortlink(const char *begin, const char *end, int newblock) {
- const char *p, *c;
- int ismail = 0;
-
- if(*begin != '<')
- return 0;
- for(p = begin+1; p && p != end && !strchr(" \t\n",*p); p++) {
- switch(*p) {
- case '#':
- case ':':
- ismail = -1;
- break;
- case '@':
- if(ismail == 0)
- ismail = 1;
- break;
- case '>':
- if(ismail == 0)
- return 0;
- fputs("<a href=\"",stdout);
- if(ismail == 1) {
- /* mailto: */
- fputs("&#x6D;&#x61;i&#x6C;&#x74;&#x6F;:",stdout);
- for(c = begin+1; *c != '>'; c++) {
- printf("&#%u;",*c);
- }
- fputs("\">",stdout);
- for(c = begin+1; *c != '>'; c++) {
- printf("&#%u;",*c);
- }
- }
- else {
- hprint(begin+1,p);
- fputs("\">",stdout);
- hprint(begin+1,p);
- }
- fputs("</a>",stdout);
- return p - begin + 1;
- }
- }
- return 0;
-}
-
-unsigned int
-dosurround(const char *begin, const char *end, int newblock) {
- unsigned int i,l;
- const char *p, *ps, *q, *qend;
-
- for(i = 0; i < LENGTH(surround); i++) {
- l = strlen(surround[i].search);
- if(end - begin < l || strncmp(begin,surround[i].search,l) != 0)
- continue;
- for(ps = surround[i].search; *ps == '\n'; ps++);
- l = strlen(ps);
- p = begin + strlen(surround[i].search) - 1;
- do {
- p = strstr(p+1, ps);
- } while(p && p[-1] == '\\');
- if(!p || p > end)
- continue;
- fputs(surround[i].before,stdout);
- for(q = begin + strlen(surround[i].search); *q == ' '; q++);
- for(qend = p-1; *qend == ' '; qend--);
- if(surround[i].process)
- process(q, qend+1,0);
- else
- hprint(q, qend+1);
- fputs(surround[i].after,stdout);
- return p - begin + l;
- }
- return 0;
-}
-
-unsigned int
-dounderline(const char *begin, const char *end, int newblock) {
- unsigned int i, j, l;
- const char *p;
-
- if(!newblock)
- return 0;
- p = begin;
- for(l = 0; p[l] != '\n' && p[l] && p+l != end; l++);
- p += l + 1;
- if(l == 0)
- return 0;
- for(i = 0; i < LENGTH(underline); i++) {
- for(j = 0; p[j] != '\n' && p[j] == underline[i].search[0] && p+j != end; j++);
- if(j >= l) {
- fputs(underline[i].before,stdout);
- if(underline[i].process)
- process(begin, begin + l, 0);
- else
- hprint(begin, begin + l);
- fputs(underline[i].after,stdout);
- return -(j + p - begin);
- }
- }
- return 0;
-}
-
-void
-hprint(const char *begin, const char *end) {
- const char *p;
-
- for(p = begin; p && p != end; p++) {
- if(*p == '&')
- fputs("&amp;",stdout);
- else if(*p == '"')
- fputs("&quot;",stdout);
- else if(*p == '>')
- fputs("&gt;",stdout);
- else if(*p == '<')
- fputs("&lt;",stdout);
- else
- putchar(*p);
- }
-}
-
-void
-process(const char *begin, const char *end, int newblock) {
- const char *p, *q;
- int affected;
- unsigned int i;
-
- for(p = begin; *p && p < end;) {
- if(newblock)
- while(*p == '\n') p++;
- affected = 0;
- for(i = 0; i < LENGTH(parsers) && affected == 0; i++)
- affected = parsers[i](p, end, newblock);
- p += abs(affected);
- if(!affected) {
- if(nohtml)
- hprint(p,p+1);
- else
- putchar(*p);
- p++;
- }
- for(q = p; *q == '\n' && q < end; q++);
- if(q == end)
- return;
- else if(p[0] == '\n' && p[1] == '\n')
- newblock = 1;
- else
- newblock = affected < 0;
- }
-}
-
-int
-main(int argc, char *argv[]) {
- char *p, *buffer;
- int s;
-
- source = stdin;
- if(argc > 1 && strcmp("-v", argv[1]) == 0)
- eprint("markdown in C %s (C) Enno Boland\n",VERSION);
- else if(argc > 1 && strcmp("-h", argv[1]) == 0)
- eprint("Usage %s [-n] [file]\n -n escape html strictly\n",argv[0]);
- if(argc > 1 && strcmp("-n", argv[1]) == 0)
- nohtml = 1;
- if(argc > 1 + nohtml && strcmp("-", argv[1 + nohtml]) != 0
- && !(source = fopen(argv[1 + nohtml],"r")))
- eprint("Cannot open file `%s`\n",argv[1 + nohtml]);
- if(!(buffer = malloc(BUFFERSIZE)))
- eprint("Malloc failed.");
- bsize = BUFFERSIZE;
- buffer[0] = '\0';
- p = buffer+strlen(buffer);
- while((s = fread(p, sizeof(char),BUFFERSIZE, source))) {
- p += s;
- *p = '\0';
- if(BUFFERSIZE + strlen(buffer) > bsize) {
- bsize += BUFFERSIZE;
- if(!(buffer = realloc(buffer, bsize)))
- eprint("Malloc failed.");
- }
- }
- process(buffer,buffer+strlen(buffer),1);
- free(buffer);
- return EXIT_SUCCESS;
-}