-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmain.go
More file actions
91 lines (72 loc) · 1.47 KB
/
main.go
File metadata and controls
91 lines (72 loc) · 1.47 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
package main
import (
"flag"
"fmt"
"my-http/httphelper"
"my-http/worker"
"net/http"
neturl "net/url"
"os"
"os/signal"
"syscall"
)
// Command-line configuration and shared state for the program.
var (
// parallel holds the value of the -parallel flag (default 10); main passes it
// as the second argument to worker.Init.
parallel = flag.Int("parallel", 10, "the numbers of parallel request")
// dispatcher is the worker dispatcher assigned in main and used by
// processRequests to queue jobs.
dispatcher *worker.Dispatcher
)
// webScrapper fetches URL content through the HTTP client it holds.
type webScrapper struct {
// client is the HTTP client that PullContent hands to httphelper.Get.
client *http.Client
}
// PullContent requests url through httphelper.Get using the scrapper's HTTP
// client and returns the string that call produces (callers treat it as an MD5
// string; presumably a digest of the response body -- confirm against
// httphelper). On failure it returns the empty string together with the
// unmodified error.
func (ws *webScrapper) PullContent(url string) (string, error) {
	digest, err := httphelper.Get(url, ws.client)
	if err != nil {
		return "", err
	}
	return digest, nil
}
// main parses the command-line flags, starts the worker dispatcher, queues one
// job per URL argument and then blocks until SIGINT or SIGQUIT arrives, at
// which point it stops the dispatcher and exits.
func main() {
	// Flags are parsed here rather than in an init function: init runs before
	// the testing package registers its own flags, so parsing there makes
	// `go test` fail with "flag provided but not defined".
	flag.Parse()

	// Require at least one positional URL. Checking the parsed arguments
	// (instead of len(os.Args)) also rejects invocations that pass only flags,
	// which would otherwise queue nothing and wait for a signal.
	if flag.NArg() == 0 {
		flag.Usage()
		os.Exit(1)
	}

	// Buffered so that a signal delivered before the receive below is not lost.
	stop := make(chan os.Signal, 1)
	signal.Notify(stop, syscall.SIGINT, syscall.SIGQUIT)

	// Start the dispatcher. NOTE(review): the meaning of the first argument
	// (200) is defined by the worker package -- presumably a queue size; confirm.
	dispatcher = worker.Init(200, *parallel)
	processRequests()

	<-stop
	dispatcher.Stop()
	fmt.Println("Shutdown Process ...")
}
func processRequests() {
urls := flag.Args()
for _, url := range urls {
u, err := neturl.Parse(url)
if err != nil {
fmt.Printf("Error: %v\n", err)
}
if u.Scheme == "" {
u.Scheme = "http"
}
dispatcher.AddJob(worker.Job{
Payload: u.String(),
Handler: handleRequest(),
})
}
}
// handleRequest builds the worker.Handler used for URL jobs.
//
// The returned handler receives the job payload, creates a fresh client via
// httphelper.CustomClient, fetches the payload's string form through a
// webScrapper and prints "<payload> <result>" to standard output. It returns
// the payload on success, or an empty string and the error on failure.
var handleRequest = func() worker.Handler {
	return func(url interface{}) (interface{}, error) {
		fetcher := &webScrapper{client: httphelper.CustomClient()}

		// The payload arrives as an interface value; render it with the
		// default format to obtain the URL text.
		target := fmt.Sprint(url)

		sum, err := fetcher.PullContent(target)
		if err != nil {
			return "", err
		}

		fmt.Printf("%v %v \n", url, sum)
		return url, nil
	}
}