#include #include #include #include /* * go from http with latin1 escapes to utf, * we assume that anything >= Runeself is already in utf */ char * httpunesc(HConnect *cc, char *s) { char *t, *v, *p; int c, n; Htmlesc *e; Rune r; v = halloc(cc, UTFmax*strlen(s) + 1); for(t = v; c = *s;){ if(c == '&'){ if(s[1] == '#' && (n = strtoul(s+2, &p, 10)) != 0 && *p == ';'){ r = n; t += runetochar(t, &r); s = p+1; continue; }else if(s[1] == '#' && (s[2] == 'x' || s[2] == 'X') && (n = strtoul(s+3, &p, 16)) != 0 && *p == ';'){ r = n; t += runetochar(t, &r); s = p+1; continue; } else { for(e = htmlesc; e->name != nil; e++) if(strncmp(e->name, s, strlen(e->name)) == 0) break; if(e->name != nil){ t += runetochar(t, &e->value); s += strlen(e->name); continue; } } } *t++ = c; s++; } *t = 0; return v; }