blob: 2a02e0fdfb05f136344e9e7ffdfdc83be5521895 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
|
#!/usr/bin/env bash
uri="$1"
scheme=$(printf "%s\n" "$uri" | uricut -s)
path=$(printf "%s\n" "$uri" | uricut -p)
qs=$(printf "%s\n" "$uri" | uricut -q)
domain=$(printf "%s\n" "$uri" | uricut -d)
port=$(printf "%s\n" "$uri" | uricut -P)
if [ "$scheme" = "http" -o "$scheme" = "https" ];then
## dereference ONLY ONCE. give up after that.
newuri="$(unshorten.sh "$uri")"
if [ "$newuri" ];then
uri="$newuri"
fi
# newuri="$(unshorten.sh "$uri")"
# if [ "$newuri" ];then
# uri="$newuri"
# fi
fi
if [ ! "$port" ];then
if [ "$scheme" = "https" ];then
port=443
SSL=--ssl
fi
if [ "$scheme" = "http" ];then
port=80
fi
fi
case "$scheme" in
http*)
if [ "$qs" ];then
path="${path}?${qs}"
fi
if [ "$port" ];then
UA="Mozilla/5.0 (impersonator)"
# content_type="$(printf "HEAD %s HTTP/1.1\r\nHost: %s\r\nUser-Agent: %s\r\n\r\n" "$path" "$domain" "$UA" | ncat -4 $SSL "$domain" "$port" | grep -i '^Content-Type: ' | head -n1 | cut '-d ' -f2 | cut '-d;' -f1 | tr -d '\r\n')"
a_header="$((curl -gA "$UA" -Lsi "$uri" || echo curl failed) | head -c 10000 | egrep -ai '^curl failed|^Location: |^Content-Type: ' | head -n1 | tr -d '\r\n')"
if printf "%s\n" "${a_header}" | grep -i '^Content-Type: ' 2>&1 >/dev/null 2>&1;then
content_type="$(printf '%s\n' "${a_header}" | cut '-d ' -f2- | cut '-d;' -f1)"
fi
#if printf "%s\n" "${a_header}" | grep -i '^Location: ' 2>&1 >/dev/null 2>&1;then
# content_type="redirect. ${a_header}"
#fi
if printf "%s\n" "${a_hreader}" | grep -i '^curl failed' 2>&1 >/dev/null 2>&1;then
content_type="curl failed. cert expired? dunno yet. TODO: code openssl checker."
fi
### main.lv doesn't have content-type on some pages, so if the content-type is missing or empty, we're assuming html
if [ "${content_type}" = "text/html" -o "${content_type}" = "application/xhtml+xml" -o "${content_type}" = "" ];then
# title="$(printf "GET %s HTTP/1.1\r\nHost: %s\r\nUser-Agent: %s\r\n\r\n" "$path" "$domain" "$UA" | ncat -4 $SSL "$domain" "$port" | head -c 10000 | tr -d '\n' | tr '<' '\n' | grep -A 10 '^title>' | grep -B 10 '^\/title>' | cut '-d>' -f2)"
title="$(curl -gsi "$uri" | head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep .)"
if [ "${content_type}" = "" ];then
printf "WTF: header: %s\n" "${a_header}"
printf "WARNING: NO CONTENT-TYPE RETURNED FROM SERVER. Assuming text/html. title: %s\n" "$title" | html_entities_decode
else
printf "title: %s\n" "$title" | html_entities_decode
fi
else
p rintf "%s\n" "${a_header}"
fi
fi
;;
gemini)
if [ "$qs" ];then
path="${path}?${qs}"
fi
first=1
gemini-get "$uri" | while read -r line;do
if [ "$first" ];then
unset first
type="$(printf "%s\n" "$line" | tr -s ' ' | cut '-d ' -f2 | tr -d '\r')"
if [ "$type" != 'text/gemini' ];then
if [ "$type" = "text/html" ];then
head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep .
elif [ "$type" = "text/plain" ];then
printf "title: %s\n" "$(head -n1)"
else
printf "title: %s\n" "$(printf "%s\n" "$line" | tr '\t' ' ' | tr -s ' ' | cut '-d ' -f2-)"
fi
fi
else
printf "title: %s\n" "$(printf "%s\n" "$line" | grep '^#' | sed 's/^#* *//g')"
fi
done | head -n1
;;
magnet)
printf "title: %s\n" "$(printf "%s\n" "$uri" | tr '&' '\n' | grep ^dn= | cut -d= -f2- | uriunescape)"
;;
dns)
if [ "$qs" ] ; then
export QUERY_STRING="$(printf "%s\n" "$qs" | tr 'A-Z' 'a-z' | tr ';' '&')"
if [ "$(query_param type)" ];then
type="-t $(query_param "type")"
fi
if [ "$(query_param class)" ];then
class="-c $(query_param "class")"
fi
fi
if [ "$domain" ];then
server="@$domain"
path="$(printf "%s\n" "$path" | sed "s|^/||")"
else
server=""
fi
dig $class $type "$path" +short $server | tr '\n' ' ' | sed 's/ $/\n/'
;;
ftp)
curl -g "$uri" 2>&1 | tail -n1
;;
gopher)
if [ "$qs" ];then
path="${path}?${qs}"
fi
type="$(printf "%s\n" "$uri" | uricut -p | cut -b2- | cut -b1)"
if [ "$type" = 1 -o "$type" = "" ];then
printf "title: %s\n" "$(curl -gs "$uri" | grep ^i | head -n1 | cut -f1 | cut -b2-)"
elif [ "$type" = 0 ];then
printf "title: %s\n" "$(curl -gs "$uri" | head -n1)"
elif [ "$type" = "h" ];then
printf "title: %s\n" "$(curl -gs "$uri" | head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep .)"
else
printf "title: don't know how to get title of non-1 gopher links"
fi
;;
urn)
nid="$(printf "%s\n" "$uri" | cut -d: -f2)"
nss="$(printf "%s\n" "$uri" | cut -d: -f3)"
nss2="$(printf "%s\n" "$uri" | cut -d: -f4)"
if [ "$nid" = "ietf" ];then
if [ "$nss" = "rfc" ];then
cat "/var/db/rfc/rfc${nss2}.json" | jq .title
exit 0
fi
fi
if [ "$nid" = "phrack" ];then
if [ ! "${nss2}" ];then
printf "issue %s of phrack has %d articles\n" "${nss}" "$(grep -c '.' /var/db/phrack/meta/${nss}.tsv)"
exit 0
fi
cat /var/db/phrack/meta/${nss}.tsv | grep "^${nss}/${nss2}"$'\t' | sed 's|/|\t|' | tr '\n\t' '\0\0' | xargs -n4 -0 printf 'issue %2s article %2s %79s by [%s]\n'
exit 0
fi
if [ "$nid" = "mitre" ];then
if [ "$nss" = "cve" ];then
urititle "$(urnresolve "$uri")"
exit 0
fi
fi
urnresolve "$uri"
;;
ssh)
if [ ! "$port" ];then
port=22
fi
printf "title: %s\n" "$(printf "" | nc "$domain" "$port" | head -n1)"
;;
file)
file="$(uriunescape "$path")"
if [ -e "$file" ];then
mime-type -v "$file"
else
printf "file '%s' doesn't exist.\n" "$file"
fi
;;
*)
printf "DONT KNOW HOW TO GET TITLE FOR THIS URL: %s\n" "$uri"
esac
|