summaryrefslogtreecommitdiff
path: root/urititle
blob: 662201c5950fbf62baa98de2e89d989fd7c7ed5a (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
#!/usr/bin/env bash
scheme=$(printf "%s\n" "$1" | uricut -s)
path=$(printf "%s\n" "$1" | uricut -p)
qs=$(printf "%s\n" "$1" | uricut -q)
domain=$(printf "%s\n" "$1" | uricut -d)
port=$(printf "%s\n" "$1" | uricut -P)
if [ ! "$port" ];then
  if [ "$scheme" = "https" ];then
    port=443
    SSL=--ssl
  fi
  if [ "$scheme" = "http" ];then
    port=80
  fi
fi
if [ "$qs" ];then
  path="${path}?${qs}"
fi
case "$scheme" in
http*)
  if [ "$port" ];then
    UA="Mozilla/5.0 (impersonator)"
#  content_type="$(printf "HEAD %s HTTP/1.1\r\nHost: %s\r\nUser-Agent: %s\r\n\r\n" "$path" "$domain" "$UA" | ncat -4 $SSL "$domain" "$port" | grep -i '^Content-Type: ' | head -n1 | cut '-d ' -f2 | cut '-d;' -f1 | tr -d '\r\n')"
    a_header="$((curl -Lsi "$1" || echo curl failed) | head -c 10000 | egrep -ai '^curl failed|^Location: |^Content-Type: ' | head -n1 | tr -d '\r\n')"
    if printf "%s\n" "${a_header}" | grep -i '^Content-Type: ' 2>&1 >/dev/null 2>&1;then
      content_type="$(printf '%s\n' "${a_header}" | cut '-d ' -f2- | cut '-d;' -f1)"
    fi
    #if printf "%s\n" "${a_header}" | grep -i '^Location: ' 2>&1 >/dev/null 2>&1;then
    #  content_type="redirect. ${a_header}"
    #fi
    if printf "%s\n" "${a_hreader}" | grep -i '^curl failed' 2>&1 >/dev/null 2>&1;then
      content_type="curl failed. cert expired? dunno yet. TODO: code openssl checker."
    fi
    if [ "${content_type}" = "text/html" -o "${content_type}" = "application/xhtml+xml" ];then
#    title="$(printf "GET %s HTTP/1.1\r\nHost: %s\r\nUser-Agent: %s\r\n\r\n" "$path" "$domain" "$UA" | ncat -4 $SSL "$domain" "$port" | head -c 10000 | tr -d '\n' | tr '<' '\n' | grep -A 10 '^title>' | grep -B 10 '^\/title>' | cut '-d>' -f2)"
      title="$(curl -si "$1" | head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep .)"
      printf "title: %s\n" "$title" | html_entities_decode
    else
      printf "%s %s\n" "${a_header}" "${content_type}"
    fi
  fi
  ;;
gemini)
  first=1
  gemini-get "$1" | while read -r line;do
    if [ "$first" ];then
      unset first
      type="$(printf "%s\n" "$line" | tr -s ' ' | cut '-d ' -f2 | tr -d '\r')"
      if [ "$type" != 'text/gemini' ];then
        if [ "$type" = "text/html" ];then
          head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep .
        else
          printf "title: %s\n" "$(printf "%s\n" "$line" | tr '\t' ' ' | tr -s ' ' | cut '-d ' -f2-)"
        fi
      fi
    else
      printf "title: %s\n" "$(printf "%s\n" "$line" | grep '^#' | sed 's/^#* *//g')"
    fi
  done | head -n1
  ;;
magnet)
  printf "title: %s\n" "$(printf "%s\n" "$1" | tr '&' '\n' | grep ^dn= | cut -d= -f2- | uriunescape)"
  ;;
ftp)
  curl "$1" 2>&1 | tail -n1
  ;;
gopher)
  type="$(printf "%s\n" "$1" | uricut -p | cut -b2- | cut -b1)"
  if [ "$type" = 1 -o "$type" = "" ];then
    printf "title: %s\n" "$(curl -s "$1" | grep ^i | head -n1 | cut -f1 | cut -b2-)"
  elif [ "$type" = 0 ];then
    printf "title: %s\n" "$(curl -s "$1" | head -n1)"
  elif [ "$type" = "h" ];then
    printf "title: %s\n" "$(curl -s "$1" | head -c 1000000 | tr -d '\n' | tr '<' '\n' | grep -iA 10 '^title' | grep -iB 10 '^\/title>' | cut '-d>' -f2 | tr '\t' ' ' | sed 's/^ *//g' | sed 's/ *$//g' | grep .)"
  else
    printf "title: don't know how to get title of non-1 gopher links"
  fi
  ;;
ssh)
  if [ ! "$port" ];then
    port=22
  fi
  printf "title: %s\n" "$(printf "" | nc "$domain" "$port" | head -n1)"
  ;;
*)
  printf "DONT KNOW HOW TO GET TITLE FOR THIS URL: %s\n" "$1"
esac