-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain.go
164 lines (141 loc) · 3.39 KB
/
main.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
package main
import (
"fmt"
"github.com/PuerkitoBio/goquery"
"io/ioutil"
"net/http"
"os"
"strings"
"sync"
)
//var Urls = [...]string{
// //"http://www.weijin365.com/",
// "http://www.wanxuechuang.com/",
//}
// FileName is the local path prefix under which downloaded files are stored.
var FileName = "D:/goProject/src/website/麦穗教育"
// WebUrl is the base URL of the site to fetch; references found in pages are appended to it.
var WebUrl = "http://www.maisuimx.com"
var rwlock sync.RWMutex // Global read-write lock; not referenced by any code visible in this file.
// main fetches the landing page at WebUrl, lets parseHtml mirror the resources
// the page references, and stores the page itself as
// FileName + "/html/index.html".
func main() {
	pageURL := WebUrl

	resp, err := http.Get(pageURL)
	if err != nil {
		fmt.Println(err)
		return
	}
	defer resp.Body.Close()

	// Crawl referenced resources only once the site is known to be reachable.
	parseHtml(pageURL, 1)

	if resp.StatusCode != http.StatusOK {
		return
	}
	fmt.Println("请求成功")

	body, err := ioutil.ReadAll(resp.Body)
	if err != nil {
		fmt.Println(err)
		return
	}

	target := FileName + "/html/index.html"
	if err := CreateMutiDir(target); err != nil {
		// CreateMutiDir has already printed the failure.
		return
	}
	// WriteFile truncates an existing file, so a shorter page never leaves
	// stale bytes from a previous run behind.
	if err := ioutil.WriteFile(target, body, os.ModePerm); err != nil {
		fmt.Println(err.Error())
	}
}
// parseHtml loads the HTML document at url and hands every resource reference
// it finds to riteData.
//
// When mod is 1 the src of each <script> and <img> element and the href of
// each <link> and <a> element are followed, in that order. For any other mod
// only the src of <img> elements is followed.
//
// If the document cannot be loaded the error is printed and nothing is
// followed. Elements that lack the attribute (or carry an empty one) are
// skipped.
func parseHtml(url string, mod int) {
	doc, err := goquery.NewDocument(url)
	if err != nil {
		// doc is unusable here; continuing would dereference a nil document.
		fmt.Println(err.Error())
		return
	}

	type target struct {
		selector string
		attr     string
	}
	targets := []target{{"img", "src"}}
	if mod == 1 {
		targets = []target{
			{"script", "src"},
			{"link", "href"},
			{"img", "src"},
			{"a", "href"},
		}
	}

	for _, tgt := range targets {
		attr := tgt.attr
		doc.Find(tgt.selector).Each(func(_ int, sel *goquery.Selection) {
			ref, ok := sel.Attr(attr)
			if !ok || ref == "" {
				// e.g. an inline <script> without src: there is nothing to download.
				return
			}
			fmt.Println(ref)
			riteData(ref)
		})
	}
}
// riteData downloads WebUrl+url with DoGet and stores the response body at
// the local path FileName+url, creating parent directories as needed.
//
// If the local path contains no "." it is treated as a page: "index.html" is
// appended to the path and the page's images are fetched via parseHtml with
// mod 2. Nothing is written when the download fails or the directory cannot
// be created.
func riteData(url string) {
	body := DoGet(WebUrl + url)
	if body == nil {
		return
	}

	fname := FileName + url
	if err := CreateMutiDir(fname); err != nil {
		// CreateMutiDir has already printed the failure.
		return
	}

	// NOTE(review): the "." test looks at the whole path (FileName included),
	// and "index.html" is appended without a separator, so "/about" becomes
	// ".../aboutindex.html" — confirm this layout is intended.
	if !strings.Contains(fname, ".") {
		fname += "index.html"
		parseHtml(WebUrl+url, 2)
	}

	// WriteFile truncates an existing file, so rewriting with a shorter body
	// does not leave stale trailing bytes.
	if err := ioutil.WriteFile(fname, body, 0666); err != nil {
		fmt.Println(err.Error())
	}
}
// CreateMutiDir makes sure the directory part of filePath exists, creating
// any missing parents. The directory part is everything up to and including
// the last "/"; the remainder is treated as a file name and ignored.
//
// A filePath without any "/" has no directory part, so nothing is created and
// nil is returned. On failure the error is printed and returned.
func CreateMutiDir(filePath string) error {
	dir := filePath[:strings.LastIndex(filePath, "/")+1]
	if dir == "" {
		// Bare file name: os.MkdirAll("") would fail, yet there is nothing to create.
		return nil
	}
	// MkdirAll is a no-op for a directory that already exists, so no
	// separate existence check is needed.
	if err := os.MkdirAll(dir, os.ModePerm); err != nil {
		fmt.Println("创建文件夹失败,error info:", err)
		return err
	}
	return nil
}
// isExist reports whether the file or directory at path exists (true means
// it exists). It returns true when os.Stat succeeds; when os.Stat fails, the
// result is whatever os.IsExist says about that error.
func isExist(path string) bool {
	if _, statErr := os.Stat(path); statErr != nil {
		return os.IsExist(statErr)
	}
	return true
}
// DoGet issues a GET request to url with the fixed X-AUTH-TOKEN, User-Agent
// and Content-Type headers and returns the response body.
//
// It returns nil when the request cannot be built or sent, when the status is
// not 200, or when the body cannot be read completely. "请求成功" is printed
// for a 200 response and "请求失败" for a request that did not yield one.
func DoGet(url string) []byte {
	req, err := http.NewRequest("GET", url, nil)
	if err != nil {
		// A malformed URL yields a nil request; bail out before touching it.
		fmt.Println("请求失败")
		return nil
	}
	// NOTE(review): hard-coded credential that is sent to every URL passed in;
	// consider loading it from configuration and limiting it to the host that
	// needs it.
	req.Header.Add("X-AUTH-TOKEN", "eyJhbGciOiJIUzI1NiJ9.eyJqdGkiOiIxNTc3ODI1MDI1NSIsInN1YiI6IjE1Nzc4MjUwMjU1IiwiaWF0IjoxNjA4MzUwMjQ2fQ.8pS7nUx4P6mcf0LXIATIgmQt_5F2OKI370T6-uqknEc")
	req.Header.Add("User-Agent", "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/87.0.4280.88 Safari/537.36")
	req.Header.Add("Content-Type", "application/json;charset=UTF-8")

	client := &http.Client{}
	resp, err := client.Do(req)
	if err != nil {
		fmt.Println("请求失败")
		return nil
	}
	// Always release the connection, including on non-200 responses.
	defer resp.Body.Close()

	if resp.StatusCode != http.StatusOK {
		fmt.Println("请求失败")
		return nil
	}
	fmt.Println("请求成功")

	body, err := ioutil.ReadAll(resp.Body)
	if err != nil {
		// A partially read body would be saved as a truncated file; report and drop it.
		fmt.Println(err)
		return nil
	}
	return body
}