webtoon-dl-gif-support/main.go

117 lines
2.7 KiB
Go
Raw Normal View History

2023-12-20 10:33:51 -08:00
package main
import (
2023-12-21 08:38:48 -08:00
"bytes"
2023-12-20 10:33:51 -08:00
"fmt"
"github.com/anaskhan96/soup"
2023-12-21 08:38:48 -08:00
"github.com/signintech/gopdf"
"image"
"io"
"net/http"
2023-12-20 10:33:51 -08:00
"os"
2023-12-21 09:20:50 -08:00
"strings"
2023-12-20 10:33:51 -08:00
)
2023-12-21 09:20:50 -08:00
// getImgLinks downloads the page at url and returns the "data-url" attribute
// of every <img> element found inside the <div class="viewer_lst"> container,
// in the order soup's FindAll reports them. An <img> without a "data-url"
// attribute contributes an empty string.
//
// The function prints a message and exits the process with status 1 when the
// page cannot be fetched, cannot be parsed, or has no viewer container.
func getImgLinks(url string) []string {
	resp, err := soup.Get(url)
	if err != nil {
		fmt.Printf("Error fetching page: %v\n", err)
		os.Exit(1)
	}

	doc := soup.HTMLParse(resp)
	if doc.Error != nil {
		fmt.Printf("Error parsing page: %v\n", doc.Error)
		os.Exit(1)
	}

	// Find reports a miss through Root.Error and leaves the node pointer nil;
	// chaining FindAll onto that result would dereference nil and panic.
	viewer := doc.Find("div", "class", "viewer_lst")
	if viewer.Error != nil {
		fmt.Printf("Error locating image list: %v\n", viewer.Error)
		os.Exit(1)
	}

	imgs := viewer.FindAll("img")
	imgLinks := make([]string, 0, len(imgs))
	for _, img := range imgs {
		imgLinks = append(imgLinks, img.Attrs()["data-url"])
	}
	return imgLinks
}
2023-12-21 08:38:48 -08:00
// fetchImage performs an HTTP GET on imgLink and returns the raw response
// body.
//
// The request is sent with a Referer header of "http://www.webtoons.com"
// (presumably required by the image host to allow the download — confirm).
//
// Any failure — building the request, performing it, a non-2xx status, or
// reading the body — prints a message and exits the process with status 1.
func fetchImage(imgLink string) []byte {
	req, err := http.NewRequest("GET", imgLink, nil)
	if err != nil {
		fmt.Println(err)
		os.Exit(1)
	}
	req.Header.Set("Referer", "http://www.webtoons.com")

	response, err := http.DefaultClient.Do(req)
	if err != nil {
		fmt.Println(err.Error())
		os.Exit(1)
	}
	defer response.Body.Close()

	// Without this check an error page (403, 404, ...) would be returned as
	// if it were image data and only fail later with an opaque decode error.
	if response.StatusCode < 200 || response.StatusCode > 299 {
		fmt.Printf("unexpected status %q fetching %s\n", response.Status, imgLink)
		os.Exit(1)
	}

	var buff bytes.Buffer
	if _, err := io.Copy(&buff, response.Body); err != nil {
		fmt.Println(err.Error())
		os.Exit(1)
	}
	return buff.Bytes()
}
2023-12-20 10:33:51 -08:00
func main() {
2023-12-21 09:20:50 -08:00
if len(os.Args) < 2 {
fmt.Println("Usage: webtoon-dl <url>")
2023-12-20 10:33:51 -08:00
os.Exit(1)
}
2023-12-21 09:20:50 -08:00
url := os.Args[1]
imgLinks := getImgLinks(url)
fmt.Println(fmt.Sprintf("found %d pages", len(imgLinks)))
2023-12-21 08:38:48 -08:00
pdf := gopdf.GoPdf{}
pdf.Start(gopdf.Config{Unit: gopdf.UnitPT, PageSize: *gopdf.PageSizeA4})
for _, imgLink := range imgLinks {
fmt.Println(imgLink)
img := fetchImage(imgLink)
holder, err := gopdf.ImageHolderByBytes(img)
if err != nil {
2023-12-21 09:20:50 -08:00
fmt.Println(err.Error())
os.Exit(1)
2023-12-21 08:38:48 -08:00
}
d, _, err := image.DecodeConfig(bytes.NewReader(img))
if err != nil {
2023-12-21 09:20:50 -08:00
fmt.Println(err.Error())
os.Exit(1)
2023-12-21 08:38:48 -08:00
}
// gopdf assumes dpi 128 https://github.com/signintech/gopdf/issues/168
// W and H are in points, 1 point = 1/72 inch
2023-12-21 09:20:50 -08:00
// convert pixels (Width and Height) to points
// subtract 1 point to account for margins
2023-12-21 08:38:48 -08:00
pdf.AddPageWithOption(gopdf.PageOption{PageSize: &gopdf.Rect{
W: float64(d.Width)*72/128 - 1,
H: float64(d.Height)*72/128 - 1,
}})
err = pdf.ImageByHolder(holder, 0, 0, nil)
if err != nil {
2023-12-21 09:20:50 -08:00
fmt.Println(err.Error())
os.Exit(1)
2023-12-21 08:38:48 -08:00
}
}
2023-12-21 09:20:50 -08:00
outURL := strings.ReplaceAll(url, "http://", "")
outURL = strings.ReplaceAll(outURL, "https://", "")
outURL = strings.ReplaceAll(outURL, "www.", "")
outURL = strings.ReplaceAll(outURL, "webtoons.com/", "")
outURL = strings.Split(outURL, "?")[0]
outURL = strings.ReplaceAll(outURL, "/viewer", "")
outURL = strings.ReplaceAll(outURL, string(os.PathSeparator), "-")
outPath := "./" + outURL + ".pdf"
err := pdf.WritePdf(outPath)
2023-12-21 08:38:48 -08:00
if err != nil {
2023-12-21 09:20:50 -08:00
fmt.Println(err.Error())
os.Exit(1)
2023-12-21 08:38:48 -08:00
}
2023-12-21 09:20:50 -08:00
fmt.Println(fmt.Sprintf("saved to %s", outPath))
2023-12-20 10:33:51 -08:00
}