plan9fox/sys/src/cmd/webfs/url.c

413 lines
6.6 KiB
C

#include <u.h>
#include <libc.h>
#include <ctype.h>
#include <fcall.h>
#include <thread.h>
#include <9p.h>
#include "dat.h"
#include "fns.h"
static char reserved[] = "%:/?#[]@!$&'()*+,;=";
static int
dhex(char c)
{
if('0' <= c && c <= '9')
return c-'0';
if('a' <= c && c <= 'f')
return c-'a'+10;
if('A' <= c && c <= 'F')
return c-'A'+10;
return 0;
}
static char*
unescape(char *s, char *spec)
{
char *r, *w;
uchar x;
if(s == nil)
return s;
for(r=w=s; x = *r; r++){
if(x == '%' && isxdigit(r[1]) && isxdigit(r[2])){
x = (dhex(r[1])<<4)|dhex(r[2]);
if(spec && strchr(spec, x)){
*w++ = '%';
*w++ = toupper(r[1]);
*w++ = toupper(r[2]);
}
else
*w++ = x;
r += 2;
continue;
}
*w++ = x;
}
*w = 0;
return s;
}
int
Efmt(Fmt *f)
{
char *s, *spec;
Str2 s2;
s2 = va_arg(f->args, Str2);
s = s2.s1;
spec = s2.s2;
for(; *s; s++)
if(*s == '%' && isxdigit(s[1]) && isxdigit(s[2])){
fmtprint(f, "%%%c%c", toupper(s[1]), toupper(s[2]));
s += 2;
}
else if(isalnum(*s) || strchr(".-_~!$&'()*,;=", *s) || strchr(spec, *s))
fmtprint(f, "%c", *s);
else
fmtprint(f, "%%%.2X", *s & 0xff);
return 0;
}
int
Nfmt(Fmt *f)
{
char d[Domlen], *s;
s = va_arg(f->args, char*);
if(utf2idn(s, d, sizeof(d)) >= 0)
s = d;
fmtprint(f, "%s", s);
return 0;
}
int
Mfmt(Fmt *f)
{
char *s = va_arg(f->args, char*);
fmtprint(f, (*s != '[' && strchr(s, ':') != nil)? "[%s]" : "%s", s);
return 0;
}
int
Ufmt(Fmt *f)
{
char *s;
Url *u;
if((u = va_arg(f->args, Url*)) == nil)
return fmtprint(f, "nil");
if(u->scheme)
fmtprint(f, "%s:", u->scheme);
if(u->user || u->host)
fmtprint(f, "//");
if(u->user){
fmtprint(f, "%E", (Str2){u->user, ""});
if(u->pass)
fmtprint(f, ":%E", (Str2){u->pass, ""});
fmtprint(f, "@");
}
if(u->host){
fmtprint(f, "%]", u->host);
if(u->port)
fmtprint(f, ":%s", u->port);
}
if(s = Upath(u))
fmtprint(f, "%E", (Str2){s, "/:@+"});
if(u->query)
fmtprint(f, "?%E", (Str2){u->query, "/:@"});
if(u->fragment)
fmtprint(f, "#%E", (Str2){u->fragment, "/:@?+"});
return 0;
}
char*
Upath(Url *u)
{
if(u){
if(u->path)
return u->path;
if(u->user || u->host)
return "/";
}
return nil;
}
static char*
remdot(char *s)
{
char *b, *d, *p;
int dir, n;
dir = 1;
b = d = s;
if(*s == '/')
s++;
for(; s; s = p){
if(p = strchr(s, '/'))
*p++ = 0;
if(*s == '.' && ((s[1] == 0) || (s[1] == '.' && s[2] == 0))){
if(s[1] == '.')
while(d > b)
if(*--d == '/')
break;
dir = 1;
continue;
} else
dir = (p != nil);
if((n = strlen(s)) > 0)
memmove(d+1, s, n);
*d++ = '/';
d += n;
}
if(dir)
*d++ = '/';
*d = 0;
return b;
}
static char*
abspath(char *s, char *b)
{
char *x, *a;
if(b && *b){
if(s == nil || *s == 0)
return estrdup(b);
if(*s != '/' && (x = strrchr(b, '/'))){
a = emalloc((x - b) + strlen(s) + 4);
sprint(a, "%.*s/%s", utfnlen(b, x - b), b, s);
return remdot(a);
}
}
if(s && *s){
if(*s != '/')
return estrdup(s);
a = emalloc(strlen(s) + 4);
sprint(a, "%s", s);
return remdot(a);
}
return nil;
}
static void
pstrdup(char **p)
{
if(p == nil || *p == nil)
return;
if(**p == 0){
*p = nil;
return;
}
*p = estrdup(*p);
}
static char*
mklowcase(char *s)
{
char *cp;
Rune r;
if(s == nil)
return s;
cp = s;
while(*cp != 0){
chartorune(&r, cp);
r = tolowerrune(r);
cp += runetochar(cp, &r);
}
return s;
}
Url*
url(char *s, Url *b)
{
char *t, *p, *x, *y;
Url *u;
if(s == nil)
s = "";
t = nil;
s = p = estrdup(s);
u = emalloc(sizeof(*u));
for(; *p; p++){
if(*p == ':'){
if(p == s)
break;
*p++ = 0;
u->scheme = s;
b = nil;
goto Abs;
}
if(!isalpha(*p))
if((p == s) || ((!isdigit(*p) && strchr("+-.", *p) == nil)))
break;
}
p = s;
if(b){
switch(*p){
case 0:
memmove(u, b, sizeof(*u));
goto Out;
case '#':
memmove(u, b, sizeof(*u));
u->fragment = p+1;
goto Out;
case '?':
memmove(u, b, sizeof(*u));
u->fragment = u->query = nil;
break;
case '/':
if(p[1] == '/'){
u->scheme = b->scheme;
b = nil;
break;
}
default:
memmove(u, b, sizeof(*u));
u->fragment = u->query = u->path = nil;
break;
}
}
Abs:
if(x = strchr(p, '#')){
*x = 0;
u->fragment = x+1;
}
if(x = strchr(p, '?')){
*x = 0;
u->query = x+1;
}
if(p[0] == '/' && p[1] == '/'){
p += 2;
if(x = strchr(p, '/')){
u->path = t = abspath(x, Upath(b));
*x = 0;
}
if(x = strchr(p, '@')){
*x = 0;
if(y = strchr(p, ':')){
*y = 0;
u->pass = y+1;
}
u->user = p;
p = x+1;
}
if((x = strrchr(p, ']')) == nil)
x = p;
if(x = strrchr(x, ':')){
*x = 0;
u->port = x+1;
}
if(x = strchr(p, '[')){
p = x+1;
if(y = strchr(p, ']'))
*y = 0;
}
u->host = p;
} else {
u->path = t = abspath(p, Upath(b));
}
Out:
pstrdup(&u->scheme);
pstrdup(&u->user);
pstrdup(&u->pass);
pstrdup(&u->host);
pstrdup(&u->port);
pstrdup(&u->path);
pstrdup(&u->query);
pstrdup(&u->fragment);
free(s);
free(t);
/* the + character encodes space only in query part */
if(s = u->query)
while(s = strchr(s, '+'))
*s++ = ' ';
if(s = u->host){
t = emalloc(Domlen);
if(idn2utf(s, t, Domlen) >= 0){
u->host = estrdup(t);
free(s);
}
free(t);
}
unescape(u->user, nil);
unescape(u->pass, nil);
unescape(u->path, reserved);
unescape(u->query, reserved);
unescape(u->fragment, reserved);
mklowcase(u->scheme);
mklowcase(u->host);
mklowcase(u->port);
return u;
}
Url*
saneurl(Url *u)
{
if(u == nil || u->scheme == nil || u->host == nil || Upath(u) == nil){
freeurl(u);
return nil;
}
if(u->port){
/* remove default ports */
switch(atoi(u->port)){
case 21: if(!strcmp(u->scheme, "ftp")) goto Defport; break;
case 70: if(!strcmp(u->scheme, "gopher"))goto Defport; break;
case 80: if(!strcmp(u->scheme, "http")) goto Defport; break;
case 443: if(!strcmp(u->scheme, "https")) goto Defport; break;
default: if(!strcmp(u->scheme, u->port)) goto Defport; break;
Defport:
free(u->port);
u->port = nil;
}
}
return u;
}
int
matchurl(Url *u, Url *s)
{
if(u){
char *a, *b;
if(s == nil)
return 0;
if(u->scheme && (s->scheme == nil || strcmp(u->scheme, s->scheme)))
return 0;
if(u->user && (s->user == nil || strcmp(u->user, s->user)))
return 0;
if(u->host && (s->host == nil || strcmp(u->host, s->host)))
return 0;
if(u->port && (s->port == nil || strcmp(u->port, s->port)))
return 0;
if(a = Upath(u)){
b = Upath(s);
if(b == nil || strncmp(a, b, strlen(a)))
return 0;
}
}
return 1;
}
void
freeurl(Url *u)
{
if(u == nil)
return;
free(u->scheme);
free(u->user);
free(u->pass);
free(u->host);
free(u->port);
free(u->path);
free(u->query);
free(u->fragment);
free(u);
}