Skip to content

Latest commit

 

History

History
301 lines (244 loc) · 16.7 KB

ubuntu.md

File metadata and controls

301 lines (244 loc) · 16.7 KB

阿里云ubuntu安装记录

机器配置:

root@iZwz9j36enzsqt8ab9tvkxZ:~# lsb_release -a
LSB Version:	core-9.20160110ubuntu0.2-amd64:core-9.20160110ubuntu0.2-noarch:security-9.20160110ubuntu0.2-amd64:security-9.20160110ubuntu0.2-noarch
Distributor ID:	Ubuntu
Description:	Ubuntu 16.04.2 LTS
Release:	16.04
Codename:	xenial

root@iZwz9j36enzsqt8ab9tvkxZ:~# free -h
              total        used        free      shared  buff/cache   available
Mem:           992M        280M         83M        3.1M        628M        534M
Swap:            0B          0B          0B
root@iZwz9j36enzsqt8ab9tvkxZ:~# df -h
Filesystem      Size  Used Avail Use% Mounted on
udev            479M     0  479M   0% /dev
tmpfs           100M  3.1M   97M   4% /run
/dev/vda1        40G  2.7G   35G   8% /
tmpfs           497M  124K  497M   1% /dev/shm
tmpfs           5.0M     0  5.0M   0% /run/lock
tmpfs           497M     0  497M   0% /sys/fs/cgroup
tmpfs           100M     0  100M   0% /run/user/0

Centos系统操作命令略有不同, 请将apt换成yum, 其他命令差异请自行解决.

以下是执行过程(全过程, 小白操作):

# 登录
ssh root@IP

# 更新安装git
apt update
apt install git

# 安装必要软件
apt install docker.io
apt install docker-compose

# 更新hosts, 复制主机名到hosts
cat /etc/hostname
vim /etc/hosts

>>>
0.0.0.0 iZwz9j36enzsqt8ab9tvkxZ
>>>

# 此后还要保证网络畅通, 提高ulimit的数量, 并且最好添加docker加速器

# scp go1.8压缩包到远程机器
# scp xxxx.tar.gz  ssh@IP:
# 安装golang1.8
# 最新: 直接获取go1.9
wget https://studygolang.com/dl/golang/go1.9.2.linux-amd64.tar.gz
tar -zxvf go1.9.2.linux-amd64.tar.gz
vim /etc/profile.d/myenv.sh

>>>>
export GOROOT=/root/go
export GOPATH=/root/gocode
export GOBIN=$GOPATH/bin
export PATH=.:$PATH:$GOROOT/bin:$GOBIN
:wq
>>>>

source /etc/profile.d/myenv.sh
go env

# 拉代码
mkdir -p ~/gocode/src/github.com/hunterhug
cd ~/gocode/src/github.com/hunterhug
git clone https://github.com/hunterhug/lizard


# 启动MYSQL和Redis
git clone https://github.com/hunterhug/GoSpider-docker
cd GoSpider-docker
chomd 777 build.sh
./build.sh

#  检测是否安装成功
docker ps
docker exec -it GoSpider-redis redis-cli -a 123456789
redis> keys *  (Ctrl+C)

docker exec -it GoSpider-mysqldb mysql -uroot -p123456789
mysql> show databases;
mysql> GRANT ALL PRIVILEGES ON *.* TO 'root'@'%'  IDENTIFIED BY '123456789'  WITH GRANT OPTION;
       flush privileges;
mysql> exit

# 编译爬虫端二进制
cd $GOPATH/src/github.com/hunterhug/lizard
chmod 777 build.sh
./build.sh

# 新建数据库
$GOPATH/src/github.com/hunterhug/lizard/spiders/usa/USQL
$GOPATH/src/github.com/hunterhug/lizard/spiders/jp/USQL
$GOPATH/src/github.com/hunterhug/lizard/spiders/de/USQL
$GOPATH/src/github.com/hunterhug/lizard/spiders/uk/USQL

docker exec -it GoSpider-mysqldb mysql -uroot -p123456789
mysql> show databases;
mysql> exit


# 方式一(推荐): 初始化数据库: 使用我抓取好的类目URL, 方式二见最后
cd $GOPATH/src/github.com/hunterhug/lizard/doc/sql
cp * /data/mydocker/mysql/conf/

# 类目已经更新了, 现在要导入这个(可能有更新的,请注意!!!)
cp days/usa_category20171026.sql /data/mydocker/mysql/conf/

docker exec -it  GoSpider-mysqldb mysql -uroot -p123456789

use jp_smart_base
source /etc/mysql/conf.d/jp_category.sql

use de_smart_base
source /etc/mysql/conf.d/de_category.sql

use smart_base
source /etc/mysql/conf.d/usa_category20171026.sql
#source /etc/mysql/conf.d/usa_category.sql

use uk_smart_base
source /etc/mysql/conf.d/uk_category.sql


# 设置定时器(cdddddddddd@qq.com请换为自己的用户名: 参见:https://proxy.mimvp.com)
crontab -e

>>>>
5 0 * * * ps -ef|grep usa/U* | awk '{print $2}' |xargs -i kill {}
20 0 * * * docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
10 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
15 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
20 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
0 3 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
5 0 * * * ps -ef|grep jp/U* | awk '{print $2}' |xargs -i kill {}
20 0 * * * docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
10 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/jp/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
15 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/jp/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
20 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/jp/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
0 3 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/jp/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
5 0 * * * ps -ef|grep uk/U* | awk '{print $2}' |xargs -i kill {}
20 0 * * * docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
10 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/uk/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
15 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/uk/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
20 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/uk/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
0 3 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/uk/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
5 0 * * * ps -ef|grep de/U* | awk '{print $2}' |xargs -i kill {}
20 0 * * * docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
10 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/de/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
15 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/de/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
20 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/de/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
0 3 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/de/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
*/1 * * * * curl http://127.0.0.1:12345/mi?orderid=cdddddddddd@qq.com\&user=jinhan\&password=459527502 > /dev/null 2>&1 &
*/1 * * * * curl http://127.0.0.1:12346/mi?orderid=cdddddddddd@qq.com\&user=jinhan\&password=459527502 > /dev/null 2>&1 &
*/1 * * * * curl http://127.0.0.1:12347/mi?orderid=cdddddddddd@qq.com\&user=jinhan\&password=459527502 > /dev/null 2>&1 &
*/1 * * * * curl http://127.0.0.1:12348/mi?orderid=cdddddddddd@qq.com\&user=jinhan\&password=459527502 > /dev/null 2>&1 &

:wq
>>>>

# 进行测试, 请逐条运行, 真的...

ps -ef|grep usa/U* | awk '{print $2}' |xargs -i kill {}
docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
ps -ef|grep jp/U* | awk '{print $2}' |xargs -i kill {}
docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/jp/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/jp/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/jp/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/jp/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
ps -ef|grep uk/U* | awk '{print $2}' |xargs -i kill {}
docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/uk/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/uk/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/uk/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/uk/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
ps -ef|grep de/U* | awk '{print $2}' |xargs -i kill {}
docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/de/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/de/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/de/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/de/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard > /dev/null 2>&1 &

# 看到有12345-12348的端口即可
netstat -ntpl

# 启动网站端

cd $GOPATH/src/github.com/hunterhug
git clone https://github.com/hunterhug/lizardWeb.git
cd lizardWeb
go build
./lizardWeb -s
nohup ./lizardWeb &
mkdir file
mkdir file/data
mkdir file/back
chmod 777 -R file

打开浏览器输入: /IP:80

# 第二天起就自动了


# 以下需要专业人员进行, 请勿操作(勿动)
# 接着特殊的: 方式二:初始化数据库(包括获取类目URL, 请耐心依次进行, 三个月一次)
# 需要先进数据库删除数据, 请逐行操作, (cdddddddddd@qq.com请换为自己的用户名: 参见:https://proxy.mimvp.com)
cd $GOPATH/src/github.com/hunterhug/lizard/tool/url/
curl "http://127.0.0.1:12345/mi?orderid=cdddddddddd@qq.com&user=jinhan&password=459527502"
curl "http://127.0.0.1:12346/mi?orderid=cdddddddddd@qq.com&user=jinhan&password=459527502"
curl "http://127.0.0.1:12347/mi?orderid=cdddddddddd@qq.com&user=jinhan&password=459527502"
curl "http://127.0.0.1:12348/mi?orderid=cdddddddddd@qq.com&user=jinhan&password=459527502"

docker exec -it GoSpider-mysqldb mysql -uroot -p123456789
>>>
use uk_smart_base
TRUNCATE  table smart_category
use de_smart_base
TRUNCATE  table smart_category
use jp_smart_base
TRUNCATE  table smart_category
use smart_base
TRUNCATE  table smart_category;
>>


# 如果出现很多错误,那你的代理不行, 请将toolproxy设置为false
go run usa_urlmain.go -toolproxy=false -toolstep=0
go run usa_urlmain.go -toolproxy=true -toolstep=1
go run usa_urlmain.go -toolproxy=true -toolstep=2
go run usa_urlmain.go -toolproxy=true -toolstep=3
go run usa_urlmain.go -toolproxy=true -toolstep=4
go run usa_urlparse.go

go run jp_urlmain.go -toolproxy=false -toolstep=0
go run jp_urlmain.go -toolproxy=true -toolstep=1
go run jp_urlmain.go -toolproxy=true -toolstep=2
go run jp_urlmain.go -toolproxy=true -toolstep=3
go run jp_urlmain.go -toolproxy=true -toolstep=4
go run jp_urlparse.go

go run uk_urlmain.go -toolproxy=false -toolstep=0
go run uk_urlmain.go -toolproxy=true -toolstep=1
go run uk_urlmain.go -toolproxy=true -toolstep=2
go run uk_urlmain.go -toolproxy=true -toolstep=3
go run uk_urlmain.go -toolproxy=true -toolstep=4
go run uk_urlparse.go

go run de_urlmain.go -toolproxy=false -toolstep=0
go run de_urlmain.go -toolproxy=true -toolstep=1
go run de_urlmain.go -toolproxy=true -toolstep=2
go run de_urlmain.go -toolproxy=true -toolstep=3
go run de_urlmain.go -toolproxy=true -toolstep=4
go run de_urlparse.go

mv /data/db/usa/url/index.md $GOPATH/src/github.com/hunterhug/lizard
# 导出数据给别人用
cd $GOPATH/src/github.com/hunterhug/lizard/doc/sql/days
docker exec -it GoSpider-mysqldb mysqldump -uroot -p123456789 smart_base smart_category>usa_category$(date +\%Y\%m\%d).sql;
docker exec -it GoSpider-mysqldb mysqldump -uroot -p123456789 de_smart_base smart_category>de_category$(date +\%Y\%m\%d).sql;
docker exec -it GoSpider-mysqldb mysqldump -uroot -p123456789 uk_smart_base smart_category>uk_category$(date +\%Y\%m\%d).sql;
docker exec -it GoSpider-mysqldb mysqldump -uroot -p123456789 jp_smart_base smart_category>jp_category$(date +\%Y\%m\%d).sql;

新品选款

支持https://www.amazon.com/gp/new-releases:

5 0 * * * ps -ef|grep usa/U* | awk '{print $2}' |xargs -i kill {}
20 0 * * * docker exec -d GoSpider-redis redis-cli -a 123456789 flushall
10 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard -toolnew=1 > /dev/null 2>&1 &
15 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard -toolnew=1 > /dev/null 2>&1 &
20 2 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard -toolnew=1 > /dev/null 2>&1 &
0 3 * * * nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard -toolnew=1 > /dev/null 2>&1 &
*/1 * * * * curl http://127.0.0.1:12345/mi?orderid=cdddddddddd@qq.com\&user=jinhan\&password=459527502 > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UURL -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard -toolnew=1 > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UIP -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard -toolnew=1 > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/ULIST -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard -toolnew=1 > /dev/null 2>&1 &
nohup /root/gocode/src/github.com/hunterhug/lizard/spiders/usa/UASIN -core=/root/gocode/src/github.com/hunterhug/lizard/public/core -root=/root/gocode/src/github.com/hunterhug/lizard -toolnew=1 > /dev/null 2>&1 &