📄 getwww
字号:
#!/bin/sh
#
# getwww - download one URL with lynx, pass it through ./htmlparser and
# print the text lines that survive a few filters on stdout.
#
# Usage: getwww URL
#
# Files (all relative to the current directory):
#   data/visited  one "[URL]" line per URL already attempted; a URL that is
#                 found there is skipped.
#   ./htmlparser  external filter, fed the raw page on stdin; its stdout is
#                 what gets filtered (presumably it strips markup - verify).
#
# Diagnostics go to stderr.
# Exit status: 1 if no URL was given or the scratch file cannot be created,
#              0 otherwise (including "already visited" and "empty download").

CONNECT_TIMEOUT=30   # seconds, handed to lynx -connect_timeout
FETCH_TIMEOUT=40     # seconds before the whole download is killed

if [ -z "${1:-}" ]; then
  echo "Incorrect usage." 1>&2
  exit 1
fi
url=$1

touch data/visited

# Fixed-string match so URL metacharacters are never treated as a regex.
if grep -qF -e "[$url]" data/visited; then
  printf '%s\n' "[-] Already got $url." 1>&2
  exit 0
fi

# Private scratch file for the raw download, removed on every exit path.
page=$(mktemp "${TMPDIR:-/tmp}/getwww.XXXXXX") || {
  echo "getwww: cannot create temporary file" 1>&2
  exit 1
}
trap 'rm -f "$page"' EXIT
trap 'exit 1' HUP INT TERM   # route signals through the EXIT trap

printf '%s\n' "[+] Trying to read $url..." 1>&2

# Record the attempt before fetching, so a URL that hangs or fails is not
# retried on the next run.
printf '[%s]\n' "$url" >>data/visited

# Fetch in the background so that exactly this lynx process can be killed
# if it overruns, without touching unrelated lynx or sleep processes.
lynx -connect_timeout="$CONNECT_TIMEOUT" -source "$url" >"$page" 2>/dev/null &
fetch_pid=$!

# Watchdog: hard-kill the fetch after FETCH_TIMEOUT seconds.  Its output is
# discarded so it never keeps a caller's pipe open, and the TERM trap lets
# the script cancel it (and its sleep) as soon as the fetch is done.
(
  sleep "$FETCH_TIMEOUT" &
  nap_pid=$!
  trap 'kill "$nap_pid" 2>/dev/null; exit 0' TERM
  wait "$nap_pid"
  kill -9 "$fetch_pid"
) >/dev/null 2>&1 &
watchdog_pid=$!

wait "$fetch_pid" 2>/dev/null
kill "$watchdog_pid" >/dev/null 2>&1

# Nothing downloaded: finish quietly.
if [ ! -s "$page" ]; then
  exit 0
fi

# Some minimal filtering, in order:
#   1. keep lines with a run of >= 10 lowercase letters, digits or spaces;
#   2. keep lines with a run of >= 4 letters;
#   3. squeeze runs of spaces, drop one leading space, drop " &";
#   4. keep lines that start and end with >= 2 lowercase letters and have
#      at least one space in between;
#   5. drop lines that end in a dangling short word (" a", " the", ...);
#   6. print each surviving line followed by one space.
#
# NOTE(review): every repetition operator below follows the bracket
# expression it repeats, because POSIX leaves an ERE that begins with a
# repetition operator undefined.  's/  */ /g' is the single-pass form of
# "collapse double spaces".  Confirm both against the upstream script.
./htmlparser <"$page" |
  grep -E '[a-z0-9 ]{10,}' |
  grep -E '[A-Za-z]{4,}' |
  sed 's/  */ /g;s/^ //g;s/ &//g' |
  grep -E '^[a-z]{2,}.*[ ]+.*[a-z]{2,}$' |
  grep -vE ' a$| the$| from$| to$| of$| and$| or$| mr$| at$' |
  awk '{ print $0 " " }'
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -