diff options
author | epoch <epoch@hacking.allowed.org> | 2020-11-15 19:12:05 -0600 |
---|---|---|
committer | epoch <epoch@hacking.allowed.org> | 2020-11-15 19:12:05 -0600 |
commit | 33c881b546d40fe88ee0a8988c654d2563d38582 (patch) | |
tree | c81d389feb917efc75c0a1d3662b9a52df8ac20d | |
parent | 4f9509b7fe0e345f5d8fa7540adba45b1a363f81 (diff) | |
parent | 07f78f990a68eda368d3e195edf34d42a196583e (diff) | |
download | uritools-33c881b546d40fe88ee0a8988c654d2563d38582.tar.gz uritools-33c881b546d40fe88ee0a8988c654d2563d38582.zip |
merge conflict resolved
-rw-r--r-- | .gitignore | 1 | ||||
-rw-r--r-- | Makefile | 8 | ||||
-rw-r--r-- | shorten.c | 37 | ||||
-rwxr-xr-x | urititle | 48 |
4 files changed, 86 insertions, 8 deletions
@@ -4,3 +4,4 @@ uriescape urimatch uriunescape urijoin +shorten @@ -2,7 +2,10 @@ CFLAGS:=-std=c11 -pedantic -Wall PREFIX:=/usr/local CC:=gcc -all: urimatch uricut urijoin uricmp uriunescape uriescape +all: urimatch uricut urijoin uricmp uriunescape uriescape shorten + +shorten: LDFLAGS=-lcrypto +shorten: shorten.c urimatch: urimatch.c uri.h @@ -39,3 +42,6 @@ install: all install -t $(PREFIX)/bin query_param install -t $(PREFIX)/bin data_handler install -t $(PREFIX)/bin unshorten.sh + install -t $(PREFIX)/bin shorten + chgrp shorten $(PREFIX)/bin/shorten + chmod g+s $(PREFIX)/bin/shorten diff --git a/shorten.c b/shorten.c new file mode 100644 index 0000000..ac76d84 --- /dev/null +++ b/shorten.c @@ -0,0 +1,37 @@ +#define _POSIX_C_SOURCE 200908 +#include <stdio.h> +#include <sys/stat.h> +#include <openssl/md5.h> +#include <string.h> +//#include <sys/types.h> +#include <sys/xattr.h> + +#define BYTES_IN_SHORT 2 +#define CACHE_DIR "/var/cache/shorten" + +int main(int argc,char *argv[]) { + int i; + if(argc < 2) return 1; + unsigned char *p=MD5((unsigned char *)argv[1],strlen(argv[1]),NULL); + char filepath[4096];//too long, oh well + char out[256]; + char tmp[3]; + strcpy(out,""); + for(i=0;i<BYTES_IN_SHORT;i++) { + snprintf(tmp,sizeof(tmp),"%02x",p[i]); + strcat(out,tmp); + } + printf("%s\n",out); + snprintf(filepath,sizeof(filepath)-1,"%s/%s",CACHE_DIR,out); + FILE *fp; + if((fp=fopen(filepath,"w")) == NULL) { + fprintf(stderr,"shorten: failed to write a file: %s\n",filepath); + return 1; + } + fprintf(fp,"%s\n",argv[1]); + //disabled for now because tmpfs can't do extended attributes + //fprintf(stderr,"fsetxattr return: %d\n",fsetxattr(fileno(fp),"user.mime-type","text/uri-list",strlen("text/uri-list"),0)); + //perror("fsetxattr"); + fchmod(fileno(fp),0664); + fclose(fp); +} @@ -1,4 +1,4 @@ -#!/bin/sh +#!/usr/bin/env bash scheme=$(printf "%s\n" "$1" | uricut -s) path=$(printf "%s\n" "$1" | uricut -p) qs=$(printf "%s\n" "$1" | uricut -q) @@ -18,30 +18,64 @@ if [ "$qs" ];then fi case "$scheme" in http*) -if [ "$port" ];then + if [ "$port" ];then UA="Mozilla/5.0 (impersonator)" # content_type="$(printf "HEAD %s HTTP/1.1\r\nHost: %s\r\nUser-Agent: %s\r\n\r\n" "$path" "$domain" "$UA" | ncat -4 $SSL "$domain" "$port" | grep -i '^Content-Type: ' | head -n1 | cut '-d ' -f2 | cut '-d;' -f1 | tr -d '\r\n')" - a_header="$(curl -Lsi "$1" | head -c 10000 | egrep -ai '^Location: |^Content-Type: ' | head -n1 | tr -d '\r\n')" + a_header="$((curl -Lsi "$1" || echo curl failed) | head -c 10000 | egrep -ai '^curl failed|^Location: |^Content-Type: ' | head -n1 | tr -d '\r\n')" if printf "%s\n" "${a_header}" | grep -i '^Content-Type: ' 2>&1 >/dev/null 2>&1;then content_type="$(printf '%s\n' "${a_header}" | cut '-d ' -f2- | cut '-d;' -f1)" - else - content_type="redirect probably" + fi + #if printf "%s\n" "${a_header}" | grep -i '^Location: ' 2>&1 >/dev/null 2>&1;then + # content_type="redirect. ${a_header}" + #fi + if printf "%s\n" "${a_hreader}" | grep -i '^curl failed' 2>&1 >/dev/null 2>&1;then + content_type="curl failed. cert expired? dunno yet. TODO: code openssl checker." fi if [ "${content_type}" = "text/html" -o "${content_type}" = "application/xhtml+xml" ];then # title="$(printf "GET %s HTTP/1.1\r\nHost: %s\r\nUser-Agent: %s\r\n\r\n" "$path" "$domain" "$UA" | ncat -4 $SSL "$domain" "$port" | head -c 10000 | tr -d '\n' | tr '<' '\n' | grep -A 10 '^title>' | grep -B 10 '^\/title>' | cut '-d>' -f2)" title="$(curl -si "$1" | head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep .)" printf "title: %s\n" "$title" | html_entities_decode else - printf "%s\n" "${a_header}" + printf "%s %s\n" "${a_header}" "${content_type}" fi fi ;; gemini) - printf "title: %s\n" "$(gemini-get "$1" | grep '^#' | head -n1 | sed 's/^#* *//g')" + first=1 + gemini-get "$1" | while read -r line;do + if [ "$first" ];then + unset first + type="$(printf "%s\n" "$line" | tr -s ' ' | cut '-d ' -f2 | tr -d '\r')" + if [ "$type" != 'text/gemini' ];then + if [ "$type" = "text/html" ];then + head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep . + else + printf "title: %s\n" "$(printf "%s\n" "$line" | tr '\t' ' ' | tr -s ' ' | cut '-d ' -f2-)" + fi + fi + else + printf "title: %s\n" "$(printf "%s\n" "$line" | grep '^#' | sed 's/^#* *//g')" + fi + done | head -n1 ;; magnet) printf "title: %s\n" "$(printf "%s\n" "$1" | tr '&' '\n' | grep ^dn= | cut -d= -f2- | uriunescape)" ;; +ftp) + curl "$1" 2>&1 | tail -n1 + ;; +gopher) + type="$(printf "%s\n" "$1" | uricut -p | cut -b2- | cut -b1)" + if [ "$type" = 1 -o "$type" = "" ];then + printf "title: %s\n" "$(curl -s "$1" | grep ^i | head -n1 | cut -f1 | cut -b2-)" + elif [ "$type" = 0 ];then + printf "title: %s\n" "$(curl -s "$1" | head -n1)" + elif [ "$type" = "h" ];then + printf "title: %s\n" "$(curl -s "$1" | head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep .)" + else + printf "title: don't know how to get title of non-1 gopher links" + fi + ;; ssh) if [ ! "$port" ];then port=22 |