parsing.c: enable builds with NO_ICONV defined

[cgit.git] / parsing.c
diff --git a/parsing.c b/parsing.c

index 36b0f0c93399f78c8fb3336efafda20cc1b417f2..f3f3b15f736521f267e87dd474fee0af5c961250 100644 (file)
--- a/parsing.c
+++ b/parsing.c
@@ -8,139 +8,112 @@
  
  #include "cgit.h"
  
-int next_char(FILE *f)
+/*
+ * url syntax: [repo ['/' cmd [ '/' path]]]
+ *   repo: any valid repo url, may contain '/'
+ *   cmd:  log | commit | diff | tree | view | blob | snapshot
+ *   path: any valid path, may contain '/'
+ *
+ */
+void cgit_parse_url(const char *url)
  {
-       int c = fgetc(f);
-       if (c=='\r') {
-               c = fgetc(f);
-               if (c!='\n') {
-                       ungetc(c, f);
-                       c = '\r';
-               }
-       }
-       return c;
-}
+       char *cmd, *p;
  
-void skip_line(FILE *f)
-{
-       int c;
+       ctx.repo = NULL;
+       if (!url || url[0] == '\0')
+               return;
  
-       while((c=next_char(f)) && c!='\n' && c!=EOF)
-               ;
-}
-
-int read_config_line(FILE *f, char *line, const char **value, int bufsize)
-{
-       int i = 0, isname = 0;
+       ctx.repo = cgit_get_repoinfo(url);
+       if (ctx.repo) {
+               ctx.qry.repo = ctx.repo->url;
+               return;
+       }
  
-       *value = NULL;
-       while(i<bufsize-1) {
-               int c = next_char(f);
-               if (!isname && (c=='#' || c==';')) {
-                       skip_line(f);
+       cmd = strchr(url, '/');
+       while (!ctx.repo && cmd) {
+               cmd[0] = '\0';
+               ctx.repo = cgit_get_repoinfo(url);
+               if (ctx.repo == NULL) {
+                       cmd[0] = '/';
+                       cmd = strchr(cmd + 1, '/');
                         continue;
                 }
-               if (!isname && isspace(c))
-                       continue;
  
-               if (c=='=' && !*value) {
-                       line[i] = 0;
-                       *value = &line[i+1];
-               } else if (c=='\n' && !isname) {
-                       i = 0;
-                       continue;
-               } else if (c=='\n' || c==EOF) {
-                       line[i] = 0;
-                       break;
-               } else {
-                       line[i]=c;
+               ctx.qry.repo = ctx.repo->url;
+               p = strchr(cmd + 1, '/');
+               if (p) {
+                       p[0] = '\0';
+                       if (p[1])
+                               ctx.qry.path = trim_end(p + 1, '/');
                 }
-               isname = 1;
-               i++;
+               if (cmd[1])
+                       ctx.qry.page = xstrdup(cmd + 1);
+               return;
         }
-       line[i+1] = 0;
-       return i;
  }
  
-int cgit_read_config(const char *filename, configfn fn)
+char *substr(const char *head, const char *tail)
  {
-       static int nesting;
-       int len;
-       char line[256];
-       const char *value;
-       FILE *f;
-
-       /* cancel deeply nested include-commands */
-       if (nesting > 8)
-               return -1;
-       if (!(f = fopen(filename, "r")))
-               return -1;
-       nesting++;
-       while((len = read_config_line(f, line, &value, sizeof(line))) > 0)
-               (*fn)(line, value);
-       nesting--;
-       fclose(f);
-       return 0;
-}
+       char *buf;
  
-char *convert_query_hexchar(char *txt)
-{
-       int d1, d2;
-       if (strlen(txt) < 3) {
-               *txt = '\0';
-               return txt-1;
-       }
-       d1 = hextoint(*(txt+1));
-       d2 = hextoint(*(txt+2));
-       if (d1<0 || d2<0) {
-               strcpy(txt, txt+3);
-               return txt-1;
-       } else {
-               *txt = d1 * 16 + d2;
-               strcpy(txt+1, txt+3);
-               return txt;
-       }
+       buf = xmalloc(tail - head + 1);
+       strncpy(buf, head, tail - head);
+       buf[tail - head] = '\0';
+       return buf;
  }
  
-int cgit_parse_query(char *txt, configfn fn)
+char *parse_user(char *t, char **name, char **email, unsigned long *date)
  {
-       char *t, *value = NULL, c;
+       char *p = t;
+       int mode = 1;
  
-       if (!txt)
-               return 0;
-
-       t = txt = xstrdup(txt);
-
-       while((c=*t) != '\0') {
-               if (c=='=') {
-                       *t = '\0';
-                       value = t+1;
-               } else if (c=='+') {
-                       *t = ' ';
-               } else if (c=='%') {
-                       t = convert_query_hexchar(t);
-               } else if (c=='&') {
-                       *t = '\0';
-                       (*fn)(txt, value);
-                       txt = t+1;
-                       value = NULL;
+       while (p && *p) {
+               if (mode == 1 && *p == '<') {
+                       *name = substr(t, p - 1);
+                       t = p;
+                       mode++;
+               } else if (mode == 1 && *p == '\n') {
+                       *name = substr(t, p);
+                       p++;
+                       break;
+               } else if (mode == 2 && *p == '>') {
+                       *email = substr(t, p + 1);
+                       t = p;
+                       mode++;
+               } else if (mode == 2 && *p == '\n') {
+                       *email = substr(t, p);
+                       p++;
+                       break;
+               } else if (mode == 3 && isdigit(*p)) {
+                       *date = atol(p);
+                       mode++;
+               } else if (*p == '\n') {
+                       p++;
+                       break;
                 }
-               t++;
+               p++;
         }
-       if (t!=txt)
-               (*fn)(txt, value);
-       return 0;
+       return p;
  }
  
-char *substr(const char *head, const char *tail)
+#ifdef NO_ICONV
+#define reencode(a, b, c)
+#else
+const char *reencode(char **txt, const char *src_enc, const char *dst_enc)
  {
-       char *buf;
+       char *tmp;
  
-       buf = xmalloc(tail - head + 1);
-       strncpy(buf, head, tail - head);
-       buf[tail - head] = '\0';
-       return buf;
+       if (!txt || !*txt || !src_enc || !dst_enc)
+               return *txt;
+
+       tmp = reencode_string(*txt, src_enc, dst_enc);
+       if (tmp) {
+               free(*txt);
+               *txt = tmp;
+       }
+       return *txt;
  }
+#endif
  
  struct commitinfo *cgit_parse_commit(struct commit *commit)
  {
@@ -155,6 +128,10 @@ struct commitinfo *cgit_parse_commit(struct commit *commit)
         ret->committer_email = NULL;
         ret->subject = NULL;
         ret->msg = NULL;
+       ret->msg_encoding = NULL;
+
+       if (p == NULL)
+               return ret;
  
         if (strncmp(p, "tree ", 5))
                 die("Bad commit: %s", sha1_to_hex(commit->object.sha1));
@@ -164,40 +141,59 @@ struct commitinfo *cgit_parse_commit(struct commit *commit)
         while (!strncmp(p, "parent ", 7))
                 p += 48; // "parent " + hex[40] + "\n"
  
-       if (!strncmp(p, "author ", 7)) {
-               p += 7;
-               t = strchr(p, '<') - 1;
-               ret->author = substr(p, t);
-               p = t;
-               t = strchr(t, '>') + 1;
-               ret->author_email = substr(p, t);
-               ret->author_date = atol(++t);
-               p = strchr(t, '\n') + 1;
+       if (p && !strncmp(p, "author ", 7)) {
+               p = parse_user(p + 7, &ret->author, &ret->author_email,
+                       &ret->author_date);
+       }
+
+       if (p && !strncmp(p, "committer ", 9)) {
+               p = parse_user(p + 9, &ret->committer, &ret->committer_email,
+                       &ret->committer_date);
         }
  
-       if (!strncmp(p, "committer ", 9)) {
+       if (p && !strncmp(p, "encoding ", 9)) {
                 p += 9;
-               t = strchr(p, '<') - 1;
-               ret->committer = substr(p, t);
-               p = t;
-               t = strchr(t, '>') + 1;
-               ret->committer_email = substr(p, t);
-               ret->committer_date = atol(++t);
-               p = strchr(t, '\n') + 1;
+               t = strchr(p, '\n');
+               if (t) {
+                       ret->msg_encoding = substr(p, t + 1);
+                       p = t + 1;
+               }
+       }
+
+       // skip unknown header fields
+       while (p && *p && (*p != '\n')) {
+               p = strchr(p, '\n');
+               if (p)
+                       p++;
         }
  
-       while (*p == '\n')
-               p = strchr(p, '\n') + 1;
+       // skip empty lines between headers and message
+       while (p && *p == '\n')
+               p++;
+
+       if (!p)
+               return ret;
  
         t = strchr(p, '\n');
-       if (t && *t) {
+       if (t) {
                 ret->subject = substr(p, t);
                 p = t + 1;
  
-               while (*p == '\n')
-                       p = strchr(p, '\n') + 1;
-               ret->msg = p;
+               while (p && *p == '\n') {
+                       p = strchr(p, '\n');
+                       if (p)
+                               p++;
+               }
+               if (p)
+                       ret->msg = xstrdup(p);
+       } else
+               ret->subject = xstrdup(p);
+
+       if (ret->msg_encoding) {
+               reencode(&ret->subject, PAGE_ENCODING, ret->msg_encoding);
+               reencode(&ret->msg, PAGE_ENCODING, ret->msg_encoding);
         }
+
         return ret;
  }
  
@@ -207,7 +203,7 @@ struct taginfo *cgit_parse_tag(struct tag *tag)
         void *data;
         enum object_type type;
         unsigned long size;
-       char *p, *t;
+       char *p;
         struct taginfo *ret;
  
         data = read_sha1_file(tag->object.sha1, &type, &size);
@@ -229,19 +225,19 @@ struct taginfo *cgit_parse_tag(struct tag *tag)
                         break;
  
                 if (!strncmp(p, "tagger ", 7)) {
-                       p += 7;
-                       t = strchr(p, '<') - 1;
-                       ret->tagger = substr(p, t);
-                       p = t;
-                       t = strchr(t, '>') + 1;
-                       ret->tagger_email = substr(p, t);
-                       ret->tagger_date = atol(++t);
+                       p = parse_user(p + 7, &ret->tagger, &ret->tagger_email,
+                               &ret->tagger_date);
+               } else {
+                       p = strchr(p, '\n');
+                       if (p)
+                               p++;
                 }
-               p = strchr(p, '\n') + 1;
         }
  
-       while (p && (*p == '\n'))
-               p = strchr(p, '\n') + 1;
+       // skip empty lines between headers and message
+       while (p && *p == '\n')
+               p++;
+
         if (p && *p)
                 ret->msg = xstrdup(p);
         free(data);