diff options
author | epochqwert <epoch@hacking.allowed.org> | 2015-08-22 03:36:15 -0500 |
---|---|---|
committer | epochqwert <epoch@hacking.allowed.org> | 2015-08-22 03:36:15 -0500 |
commit | b7849c483393cf510cbe4bca137ce4520b636685 (patch) | |
tree | 28e6410126fac350d69c9f47a7588f7dfd639841 /url.c | |
download | uritools-b7849c483393cf510cbe4bca137ce4520b636685.tar.gz uritools-b7849c483393cf510cbe4bca137ce4520b636685.zip |
initial commit.
Diffstat (limited to 'url.c')
-rw-r--r-- | url.c | 131 |
1 files changed, 131 insertions, 0 deletions
@@ -0,0 +1,131 @@ +//#include <stdio.h> +#include <string.h> +//#include <stdlib.h> + +/* + schemes are case sensitive but cononicals are lower case. + domain is case insensitive. return it lowercased? + port is optional and in decimal + path + scheme://username:password@domain:port/path?query_string#fragment_id + mailto:username@domain + + optional stuff: + scheme, username, password, port, path, query_string, fragment_id +*/ + +#include "url.h" + +/* +struct url { + char *scheme; + char *username; + char *password; + char *domain; + char *port; + char *path; + char *query_string; + char *fragment_id; +} +*/ + +void urlfromline(struct url *u,char *line) { + int i; + //split at first single / into line and path + for(i=0;line[i];i++) { + if(line[i] == '/' && line[i+1] == '/') { + i++; + continue; + } + if(line[i] == '/') { + line[i]=0; + u->path=line+i+1; + break; + } + } + if(u->path) { + if(strchr(u->path,'?')) { + u->query_string=strchr(u->path,'?'); + *u->query_string=0; + u->query_string++; + } + } + + if(u->query_string) { + if(strchr(u->query_string,'#')) { + u->fragment_id=strchr(u->query_string,'#'); + *u->fragment_id=0; + u->fragment_id++; + } + } + + if(strstr(line,"://")) { + u->scheme=line; + u->domain=strstr(line,"://"); + *u->domain=0; + u->domain+=3; + } else { + u->domain=line; + } + + if(u->domain) { + if(strchr(u->domain,'@')) { + u->username=u->domain; + u->domain=strchr(u->domain,'@'); + *u->domain=0; + u->domain++; + } + } + + if(u->username) { + if(strchr(u->username,':')) { + u->password=strchr(u->username,':'); + *u->password=0; + u->password++; + } + } + + if(u->domain) { + if(strchr(u->domain,']')) {//the end of an IPv6 address + if(strchr(strchr(u->domain,']'),':')) { + u->port=strchr(strchr(u->domain,']'),':'); + if(u->port[1] == '?') {//for magnet links + u->port=0; + } else { + *u->port=0; + u->port++; + } + } + } else { + if(strchr(u->domain,':')) { + u->port=strchr(u->domain,':'); + if(u->port[1] == '?') {//for magnet links + u->port=0; + } else { + *u->port=0; + u->port++; + } + } + } + } + + if(u->domain) {//for magnet links. + if(strchr(u->domain,'?')) { + u->query_string=strchr(u->domain,'?'); + *u->query_string=0; + u->query_string++; + } + } + + if(strchr(u->domain,':') && !strchr(u->domain,']')) {//for scheme:?query_string + u->scheme=u->domain; + *strchr(u->scheme,':')=0; + u->domain=0; + } + + if(!u->scheme && u->username) {//for mailto: + u->scheme=u->username; + u->username=u->password; + u->password=0; + } +} |