piEsposito · February 14, 2020 13:16
diff --git a/webmotors_crawl_funcs.go b/webmotors_crawl_funcs.go
 package crawl_functions

 import (
 	"fmt"
 	"sync"
 	"webmotor_crawler/query_handler"
 )

 // CrawlRoutine is a crawl worker. It builds its own QueryClient and client so
 // that workers share no request state, then takes ids from c until the channel
 // has nothing ready (or is closed). For each id it builds a link and output path
 // with CreateLink, prints the link, issues the request, converts the response
 // with query_handler.ConvertGzipToString and stores the result with
 // query_handler.SaveJsonString.
 //
 // wg.Done is called exactly once when the worker returns; the caller is
 // responsible for the matching wg.Add before starting the worker.
 func CrawlRoutine(wg *sync.WaitGroup, c chan int) {
 	// Deferred so the WaitGroup is released on every exit path.
 	defer wg.Done()

 	head := query_handler.QueryClient{
 		Accept:                    "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8",
 		Accept_encoding:           "gzip, deflate, br",
 		Accept_language:           "en-US,en;q=0.5",
 		Connection:                "keep-alive",
 		Host:                      "www.webmotors.com.br",
 		TE:                        "Trailers",
 		Upgrade_insecure_requests: "1",
 		User_agent:                "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:72.0) Gecko/20100101 Firefox/72.0",
 		// NOTE(review): ProxyUrl is set, but the client below comes from
 		// GenerateNoProxiedClient - presumably the proxy is unused; confirm.
 		ProxyUrl: "socks5://96.44.133.110:58690",
 	}

 	client := head.GenerateNoProxiedClient()

 	for {
 		// Non-blocking receive: checking len(c) and then receiving is racy when
 		// several workers drain the same channel, because another worker can
 		// take the last item in between and leave this one blocked forever.
 		select {
 		case id, ok := <-c:
 			if !ok {
 				// Channel closed and fully drained.
 				return
 			}

 			link, path := CreateLink(id)
 			fmt.Println(link)

 			req := head.CreateRequest(link)
 			resp, err := client.Do(req)
 			if err != nil {
 				// The response is not usable when Do reports an error; skip
 				// this id instead of handing it to the converter.
 				fmt.Printf("crawl %s: %v\n", link, err)
 				continue
 			}

 			// NOTE(review): whether ConvertGzipToString closes the response
 			// body is not visible from here - confirm to avoid leaking
 			// connections.
 			result := query_handler.ConvertGzipToString(resp)
 			query_handler.SaveJsonString(result, path)
 		default:
 			// Nothing ready on the channel: the work queue is empty.
 			return
 		}
 	}
 }
	package crawl_functions

	import (
	"fmt"
	"sync"
	"webmotor_crawler/query_handler"
	)

	// CrawlRoutine is a crawl worker. It builds its own QueryClient and client so
	// that workers share no request state, then takes ids from c until the channel
	// has nothing ready (or is closed). For each id it builds a link and output path
	// with CreateLink, prints the link, issues the request, converts the response
	// with query_handler.ConvertGzipToString and stores the result with
	// query_handler.SaveJsonString.
	//
	// wg.Done is called exactly once when the worker returns; the caller is
	// responsible for the matching wg.Add before starting the worker.
	func CrawlRoutine(wg *sync.WaitGroup, c chan int) {
		// Deferred so the WaitGroup is released on every exit path.
		defer wg.Done()

		head := query_handler.QueryClient{
			// The catch-all media range must be "*/*"; a bare "/" is not a valid
			// media range in an Accept header.
			Accept:                    "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8",
			Accept_encoding:           "gzip, deflate, br",
			Accept_language:           "en-US,en;q=0.5",
			Connection:                "keep-alive",
			Host:                      "www.webmotors.com.br",
			TE:                        "Trailers",
			Upgrade_insecure_requests: "1",
			User_agent:                "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:72.0) Gecko/20100101 Firefox/72.0",
			// NOTE(review): ProxyUrl is set, but the client below comes from
			// GenerateNoProxiedClient - presumably the proxy is unused; confirm.
			ProxyUrl: "socks5://96.44.133.110:58690",
		}

		client := head.GenerateNoProxiedClient()

		for {
			// Non-blocking receive: checking len(c) and then receiving is racy when
			// several workers drain the same channel, because another worker can
			// take the last item in between and leave this one blocked forever.
			select {
			case id, ok := <-c:
				if !ok {
					// Channel closed and fully drained.
					return
				}

				link, path := CreateLink(id)
				fmt.Println(link)

				req := head.CreateRequest(link)
				resp, err := client.Do(req)
				if err != nil {
					// The response is not usable when Do reports an error; skip
					// this id instead of handing it to the converter.
					fmt.Printf("crawl %s: %v\n", link, err)
					continue
				}

				// NOTE(review): whether ConvertGzipToString closes the response
				// body is not visible from here - confirm to avoid leaking
				// connections.
				result := query_handler.ConvertGzipToString(resp)
				query_handler.SaveJsonString(result, path)
			default:
				// Nothing ready on the channel: the work queue is empty.
				return
			}
		}
	}