// goop/internal/workers/download.go

package workers
import (
"fmt"
"github.com/deletescape/goop/internal/utils"
"github.com/valyala/fasthttp"
"io/ioutil"
"os"
"sync"
"time"
)
func DownloadWorker(c *fasthttp.Client, queue chan string, baseUrl, baseDir string, wg *sync.WaitGroup, allowHtml bool) {
defer wg.Done()
2020-11-24 08:00:07 +00:00
var ctr int
for {
select {
case file := <-queue:
checkRatelimted()
if file == "" {
continue
}
2020-11-24 08:00:07 +00:00
targetFile := utils.Url(baseDir, file)
if utils.Exists(targetFile) {
fmt.Printf("%s was downloaded already, skipping\n", targetFile)
continue
}
2020-11-24 08:00:07 +00:00
uri := utils.Url(baseUrl, file)
code, body, err := c.Get(nil, uri)
fmt.Printf("[-] Fetching %s [%d]\n", uri, code)
if err != nil {
fmt.Fprintf(os.Stderr, "error: %s\n", err)
continue
}
2020-11-24 08:00:07 +00:00
if code == 200 {
if !allowHtml && utils.IsHtml(body) {
fmt.Printf("warning: %s appears to be an html file, skipping\n", uri)
continue
}
if utils.IsEmptyBytes(body) {
fmt.Printf("warning: %s appears to be an empty file, skipping\n", uri)
continue
}
if err := utils.CreateParentFolders(targetFile); err != nil {
fmt.Fprintf(os.Stderr, "error: %s\n", err)
continue
}
if err := ioutil.WriteFile(targetFile, body, os.ModePerm); err != nil {
fmt.Fprintf(os.Stderr, "error: %s\n", err)
}
} else if code == 429 {
setRatelimited()
queue <- file
}
default:
// TODO: get rid of dirty hack somehow
if ctr >= graceTimes {
return
}
2020-11-24 08:00:07 +00:00
ctr++
time.Sleep(gracePeriod)
}
}
}