wrp/wrp.go

494 lines
13 KiB
Go
Raw Normal View History

2019-05-29 18:53:05 -07:00
//
// WRP - Web Rendering Proxy
//
// Copyright (c) 2013-2018 Antoni Sawicki
2020-04-23 03:27:16 -07:00
// Copyright (c) 2019-2020 Google LLC
2019-05-29 18:53:05 -07:00
//
2020-10-29 07:16:14 -07:00
//go:generate statik -f -src=. -include=wrp.html
2019-05-29 01:29:01 -07:00
package main
import (
"bytes"
2019-05-29 01:52:28 -07:00
"context"
"flag"
"fmt"
"html/template"
"image"
"image/gif"
"image/png"
2020-10-29 07:16:14 -07:00
"io/ioutil"
2019-05-29 01:52:28 -07:00
"log"
"math"
2019-05-30 02:03:17 -07:00
"math/rand"
2019-05-29 01:52:28 -07:00
"net/http"
"net/url"
2019-07-16 22:29:35 -07:00
"os"
"os/signal"
2019-05-29 01:52:28 -07:00
"strconv"
"strings"
2019-07-16 22:29:35 -07:00
"syscall"
2019-05-29 01:52:28 -07:00
"time"
2019-05-29 01:29:01 -07:00
2020-09-28 12:19:27 -07:00
"github.com/MaxHalford/halfgone"
2019-08-12 23:35:29 -07:00
"github.com/chromedp/cdproto/css"
2019-05-29 02:39:06 -07:00
"github.com/chromedp/cdproto/emulation"
"github.com/chromedp/cdproto/page"
2019-05-29 01:52:28 -07:00
"github.com/chromedp/chromedp"
"github.com/ericpauley/go-quantize/quantize"
2020-10-29 07:16:14 -07:00
"github.com/rakyll/statik/fs"
_ "github.com/tenox7/wrp/statik"
2019-05-29 01:29:01 -07:00
)
var (
version = "4.5"
srv http.Server
ctx context.Context
cancel context.CancelFunc
img = make(map[string]bytes.Buffer)
ismap = make(map[string]wrpReq)
2020-10-31 08:51:20 -07:00
noDel bool
defType string
defGeom geom
htmlTmpl *template.Template
2019-05-29 01:29:01 -07:00
)
// geom is the default geometry parsed from the -g flag.
type geom struct {
	w, h, c int64 // width, height, number of colors
}
// uiData is the value handed to the HTML UI template by printHTML.
// Fields are exported so the template can reference them.
type uiData struct {
	Version, URL, BgColor    string
	NColors, Width, Height   int64
	Scale                    float64
	ImgType, ImgURL, ImgSize string
	ImgWidth, ImgHeight      int
	MapURL, PageHeight       string
}
// printParams carries the values printHTML needs in addition to the request:
// page background color and height, plus the image's size, URLs and dimensions.
type printParams struct {
	bgColor, pageHeight, imgSize, imgURL, mapURL string
	imgWidth, imgHeight                          int
}
2020-04-24 03:06:21 -07:00
// wrpReq is a single WRP request: the parameters taken from the UI form or an
// ISMAP click, together with the HTTP request/response pair being served.
type wrpReq struct {
	url                    string              // target URL
	width, height          int64               // requested image width and height
	scale                  float64             // scale factor
	colors                 int64               // number of colors
	mouseX, mouseY         int64               // ISMAP click coordinates
	keys, buttons, imgType string              // keys to send, Fn button, image type
	out                    http.ResponseWriter // response being written
	req                    *http.Request       // request being served
}
2019-06-24 00:40:34 -07:00
2020-04-24 03:06:21 -07:00
// Parse HTML Form, Process Input Boxes, Etc.
func parseForm(w *wrpReq) {
w.req.ParseForm()
w.url = w.req.FormValue("url")
if len(w.url) > 1 && !strings.HasPrefix(w.url, "http") {
w.url = fmt.Sprintf("http://www.google.com/search?q=%s", url.QueryEscape(w.url))
2019-06-25 17:07:43 -07:00
}
w.width, _ = strconv.ParseInt(w.req.FormValue("w"), 10, 64)
w.height, _ = strconv.ParseInt(w.req.FormValue("h"), 10, 64)
if w.width < 10 && w.height < 10 {
2020-10-31 08:51:20 -07:00
w.width = defGeom.w
w.height = defGeom.h
2019-05-29 01:52:28 -07:00
}
w.scale, _ = strconv.ParseFloat(w.req.FormValue("s"), 64)
if w.scale < 0.1 {
w.scale = 1.0
2019-05-30 18:08:48 -07:00
}
w.colors, _ = strconv.ParseInt(w.req.FormValue("c"), 10, 64)
if w.colors < 2 || w.colors > 256 {
2020-10-31 08:51:20 -07:00
w.colors = defGeom.c
2019-06-02 17:06:41 -07:00
}
w.keys = w.req.FormValue("k")
w.buttons = w.req.FormValue("Fn")
w.imgType = w.req.FormValue("t")
if w.imgType != "gif" && w.imgType != "png" {
2020-10-31 08:51:20 -07:00
w.imgType = defType
2019-11-03 16:58:38 -08:00
}
log.Printf("%s WrpReq from UI Form: %+v\n", w.req.RemoteAddr, w)
2019-06-25 17:07:43 -07:00
}
2020-04-24 03:06:21 -07:00
// Display WP UI
func printHTML(w wrpReq, p printParams) {
w.out.Header().Set("Cache-Control", "max-age=0")
w.out.Header().Set("Expires", "-1")
w.out.Header().Set("Pragma", "no-cache")
w.out.Header().Set("Content-Type", "text/html")
data := uiData{
Version: version,
URL: w.url,
2020-10-31 08:51:20 -07:00
BgColor: p.bgColor,
Width: w.width,
Height: w.height,
NColors: w.colors,
Scale: w.scale,
ImgType: w.imgType,
2020-10-31 08:51:20 -07:00
ImgSize: p.imgSize,
ImgWidth: p.imgWidth,
ImgHeight: p.imgHeight,
ImgURL: p.imgURL,
MapURL: p.mapURL,
PageHeight: p.pageHeight,
2019-11-03 17:53:20 -08:00
}
err := htmlTmpl.Execute(w.out, data)
if err != nil {
log.Fatal(err)
2019-11-03 16:58:38 -08:00
}
2019-06-26 01:07:13 -07:00
}
2020-04-24 03:06:21 -07:00
// Process HTTP requests to WRP '/' url
2019-06-26 01:07:13 -07:00
func pageServer(out http.ResponseWriter, req *http.Request) {
log.Printf("%s Page Request for %s [%+v]\n", req.RemoteAddr, req.URL.Path, req.URL.RawQuery)
2019-07-10 23:58:40 -07:00
var w wrpReq
w.req = req
w.out = out
parseForm(&w)
2020-10-26 01:42:11 -07:00
if len(w.url) < 4 {
printHTML(w, printParams{bgColor: "#FFFFFF"})
2020-10-26 01:42:11 -07:00
return
2019-06-26 01:07:13 -07:00
}
navigate(w)
capture(w)
2019-06-26 01:07:13 -07:00
}
2020-04-24 03:06:21 -07:00
// Process HTTP requests to ISMAP '/map/' url
2019-06-26 01:07:13 -07:00
func mapServer(out http.ResponseWriter, req *http.Request) {
log.Printf("%s ISMAP Request for %s [%+v]\n", req.RemoteAddr, req.URL.Path, req.URL.RawQuery)
2019-07-10 23:58:40 -07:00
w, ok := ismap[req.URL.Path]
w.req = req
w.out = out
2019-06-26 01:07:13 -07:00
if !ok {
fmt.Fprintf(out, "Unable to find map %s\n", req.URL.Path)
log.Printf("Unable to find map %s\n", req.URL.Path)
return
}
2020-10-31 08:51:20 -07:00
if !noDel {
defer delete(ismap, req.URL.Path)
}
n, err := fmt.Sscanf(req.URL.RawQuery, "%d,%d", &w.mouseX, &w.mouseY)
2019-07-10 01:01:40 -07:00
if err != nil || n != 2 {
fmt.Fprintf(out, "n=%d, err=%s\n", n, err)
log.Printf("%s ISMAP n=%d, err=%s\n", req.RemoteAddr, n, err)
return
}
2019-07-10 23:58:40 -07:00
log.Printf("%s WrpReq from ISMAP: %+v\n", req.RemoteAddr, w)
2020-10-26 01:42:11 -07:00
if len(w.url) < 4 {
printHTML(w, printParams{bgColor: "#FFFFFF"})
2020-10-27 03:44:43 -07:00
return
2019-06-26 01:07:13 -07:00
}
navigate(w)
capture(w)
2019-05-29 01:29:01 -07:00
}
2020-04-24 03:06:21 -07:00
// Process HTTP requests for images '/img/' url
2019-05-29 01:29:01 -07:00
func imgServer(out http.ResponseWriter, req *http.Request) {
2019-05-31 18:20:55 -07:00
log.Printf("%s IMG Request for %s\n", req.RemoteAddr, req.URL.Path)
imgbuf, ok := img[req.URL.Path]
if !ok || imgbuf.Bytes() == nil {
2019-06-02 22:23:41 -07:00
fmt.Fprintf(out, "Unable to find image %s\n", req.URL.Path)
log.Printf("%s Unable to find image %s\n", req.RemoteAddr, req.URL.Path)
2019-06-02 22:23:41 -07:00
return
}
2020-10-31 08:51:20 -07:00
if !noDel {
defer delete(img, req.URL.Path)
}
2020-10-26 01:27:21 -07:00
switch {
case strings.HasPrefix(req.URL.Path, ".gif"):
out.Header().Set("Content-Type", "image/gif")
2020-10-26 01:27:21 -07:00
case strings.HasPrefix(req.URL.Path, ".png"):
out.Header().Set("Content-Type", "image/png")
}
out.Header().Set("Content-Length", strconv.Itoa(len(imgbuf.Bytes())))
2019-07-16 22:47:23 -07:00
out.Header().Set("Cache-Control", "max-age=0")
out.Header().Set("Expires", "-1")
out.Header().Set("Pragma", "no-cache")
out.Write(imgbuf.Bytes())
2019-05-30 02:03:17 -07:00
out.(http.Flusher).Flush()
2019-05-29 01:29:01 -07:00
}
2020-04-24 03:06:21 -07:00
// haltServer handles requests to the '/shutdown/' url: it acknowledges the
// request, cancels the browser context, shuts the HTTP server down and exits
// the process with status 1.
func haltServer(out http.ResponseWriter, req *http.Request) {
	log.Printf("%s Shutdown Request for %s\n", req.RemoteAddr, req.URL.Path)
	out.Header().Set("Cache-Control", "max-age=0")
	out.Header().Set("Expires", "-1")
	out.Header().Set("Pragma", "no-cache")
	out.Header().Set("Content-Type", "text/plain")
	fmt.Fprintf(out, "Shutting down WRP...\n")
	// Not every ResponseWriter is a Flusher; skip the flush rather than panic.
	if f, ok := out.(http.Flusher); ok {
		f.Flush()
	}
	time.Sleep(time.Second * 2)
	cancel()

	// Shutdown waits for connections to become idle, and the connection this
	// handler is running on stays active until the handler returns. Bound the
	// wait so the handler cannot block on itself indefinitely.
	sctx, scancel := context.WithTimeout(context.Background(), 5*time.Second)
	if err := srv.Shutdown(sctx); err != nil {
		log.Printf("%s Shutdown: %s\n", req.RemoteAddr, err)
	}
	scancel() // called explicitly: os.Exit does not run deferred functions
	os.Exit(1)
}
2020-10-26 01:21:42 -07:00
// Determine what action to take
func action(w wrpReq) chromedp.Action {
2020-04-24 03:09:20 -07:00
// Mouse Click
if w.mouseX > 0 && w.mouseY > 0 {
log.Printf("%s Mouse Click %d,%d\n", w.req.RemoteAddr, w.mouseX, w.mouseY)
2020-10-26 01:21:42 -07:00
return chromedp.MouseClickXY(float64(w.mouseX)/float64(w.scale), float64(w.mouseY)/float64(w.scale))
}
// Buttons
if len(w.buttons) > 0 {
log.Printf("%s Button %v\n", w.req.RemoteAddr, w.buttons)
switch w.buttons {
case "Bk":
2020-10-26 01:21:42 -07:00
return chromedp.NavigateBack()
case "Bs":
2020-10-26 01:21:42 -07:00
return chromedp.KeyEvent("\b")
case "Rt":
2020-10-26 01:21:42 -07:00
return chromedp.KeyEvent("\r")
case "<":
2020-10-26 01:21:42 -07:00
return chromedp.KeyEvent("\u0302")
case "^":
2020-10-26 01:21:42 -07:00
return chromedp.KeyEvent("\u0304")
case "v":
2020-10-26 01:21:42 -07:00
return chromedp.KeyEvent("\u0301")
case ">":
2020-10-26 01:21:42 -07:00
return chromedp.KeyEvent("\u0303")
}
2020-10-26 01:21:42 -07:00
}
// Keys
if len(w.keys) > 0 {
log.Printf("%s Sending Keys: %#v\n", w.req.RemoteAddr, w.keys)
2020-10-26 01:21:42 -07:00
return chromedp.KeyEvent(w.keys)
2019-07-10 01:01:40 -07:00
}
2020-10-26 01:21:42 -07:00
// Navigate to URL
log.Printf("%s Processing Capture Request for %s\n", w.req.RemoteAddr, w.url)
return chromedp.Navigate(w.url)
}
// Process Keyboard and Mouse events or Navigate to the desired URL.
func navigate(w wrpReq) {
err := chromedp.Run(ctx, action(w))
2019-05-31 00:41:46 -07:00
if err != nil {
if err.Error() == "context canceled" {
log.Printf("%s Contex cancelled, try again", w.req.RemoteAddr)
fmt.Fprintf(w.out, "<BR>%s<BR> -- restarting, try again", err)
ctx, cancel = chromedp.NewContext(context.Background())
2020-10-26 01:21:42 -07:00
return
}
2020-10-26 01:21:42 -07:00
log.Printf("%s %s", w.req.RemoteAddr, err)
fmt.Fprintf(w.out, "<BR>%s<BR>", err)
2019-05-31 00:41:46 -07:00
}
2020-04-24 02:45:34 -07:00
}
2020-04-24 03:06:21 -07:00
// Capture currently rendered web page to an image and fake ISMAP
func capture(w wrpReq) {
2020-04-24 02:45:34 -07:00
var err error
2020-04-23 03:25:39 -07:00
var styles []*css.ComputedStyleProperty
var r, g, b int
var h int64
var pngcap []byte
2019-08-12 23:35:29 -07:00
chromedp.Run(ctx,
emulation.SetDeviceMetricsOverride(int64(float64(w.width)/w.scale), 10, w.scale, false),
chromedp.Location(&w.url),
chromedp.ComputedStyle("body", &styles, chromedp.ByQuery),
chromedp.ActionFunc(func(ctx context.Context) error {
_, _, s, err := page.GetLayoutMetrics().Do(ctx)
if err == nil {
h = int64(math.Ceil(s.Height))
}
return nil
}),
)
2019-08-12 23:35:29 -07:00
for _, style := range styles {
if style.Name == "background-color" {
fmt.Sscanf(style.Value, "rgb(%d,%d,%d)", &r, &g, &b)
}
}
log.Printf("%s Landed on: %s, Height: %v\n", w.req.RemoteAddr, w.url, h)
2020-10-26 01:49:03 -07:00
height := int64(float64(w.height) / w.scale)
if w.height == 0 && h > 0 {
2020-10-26 01:49:03 -07:00
height = h + 30
}
2020-10-26 01:49:03 -07:00
chromedp.Run(ctx, emulation.SetDeviceMetricsOverride(int64(float64(w.width)/w.scale), height, w.scale, false))
// Capture screenshot...
err = chromedp.Run(ctx,
2020-10-27 04:39:14 -07:00
chromedp.Sleep(time.Second*2),
chromedp.CaptureScreenshot(&pngcap),
)
2019-06-24 00:40:34 -07:00
if err != nil {
if err.Error() == "context canceled" {
log.Printf("%s Contex cancelled, try again", w.req.RemoteAddr)
fmt.Fprintf(w.out, "<BR>%s<BR> -- restarting, try again", err)
ctx, cancel = chromedp.NewContext(context.Background())
2020-10-26 01:21:42 -07:00
return
}
2020-10-26 01:21:42 -07:00
log.Printf("%s Failed to capture screenshot: %s\n", w.req.RemoteAddr, err)
fmt.Fprintf(w.out, "<BR>Unable to capture screenshot:<BR>%s<BR>\n", err)
2019-06-24 00:40:34 -07:00
return
}
2019-06-26 01:07:13 -07:00
seq := rand.Intn(9999)
imgpath := fmt.Sprintf("/img/%04d.%s", seq, w.imgType)
2019-06-26 01:07:13 -07:00
mappath := fmt.Sprintf("/map/%04d.map", seq)
2019-07-10 23:58:40 -07:00
ismap[mappath] = w
var ssize string
var iw, ih int
2020-10-26 01:32:09 -07:00
switch w.imgType {
case "gif":
i, err := png.Decode(bytes.NewReader(pngcap))
if err != nil {
log.Printf("%s Failed to decode screenshot: %s\n", w.req.RemoteAddr, err)
fmt.Fprintf(w.out, "<BR>Unable to decode page screenshot:<BR>%s<BR>\n", err)
return
}
2020-09-28 12:19:27 -07:00
if w.colors == 2 {
gray := halfgone.ImageToGray(i)
i = halfgone.FloydSteinbergDitherer{}.Apply(gray)
}
var gifbuf bytes.Buffer
err = gif.Encode(&gifbuf, i, &gif.Options{NumColors: int(w.colors), Quantizer: quantize.MedianCutQuantizer{}})
if err != nil {
log.Printf("%s Failed to encode GIF: %s\n", w.req.RemoteAddr, err)
fmt.Fprintf(w.out, "<BR>Unable to encode GIF:<BR>%s<BR>\n", err)
return
}
img[imgpath] = gifbuf
2020-04-26 01:25:28 -07:00
ssize = fmt.Sprintf("%.0f KB", float32(len(gifbuf.Bytes()))/1024.0)
iw = i.Bounds().Max.X
ih = i.Bounds().Max.Y
log.Printf("%s Encoded GIF image: %s, Size: %s, Colors: %d, %dx%d\n", w.req.RemoteAddr, imgpath, ssize, w.colors, iw, ih)
2020-10-26 01:32:09 -07:00
case "png":
pngbuf := bytes.NewBuffer(pngcap)
img[imgpath] = *pngbuf
cfg, _, _ := image.DecodeConfig(pngbuf)
2020-04-26 01:25:28 -07:00
ssize = fmt.Sprintf("%.0f KB", float32(len(pngbuf.Bytes()))/1024.0)
iw = cfg.Width
ih = cfg.Height
log.Printf("%s Got PNG image: %s, Size: %s, %dx%d\n", w.req.RemoteAddr, imgpath, ssize, iw, ih)
}
printHTML(w, printParams{
2020-10-31 08:51:20 -07:00
bgColor: fmt.Sprintf("#%02X%02X%02X", r, g, b),
pageHeight: fmt.Sprintf("%d PX", h),
imgSize: ssize,
imgURL: imgpath,
mapURL: mappath,
imgWidth: iw,
imgHeight: ih,
})
log.Printf("%s Done with capture for %s\n", w.req.RemoteAddr, w.url)
2019-05-29 01:29:01 -07:00
}
// returns html template, either from html file or built-in
2020-10-29 07:16:14 -07:00
func tmpl(t string) string {
var tmpl []byte
fh, err := os.Open(t)
if err != nil {
goto statik
}
tmpl, err = ioutil.ReadAll(fh)
if err != nil {
goto statik
}
log.Printf("Got UI template from %v file\n", t)
return string(tmpl)
statik:
sfs, err := fs.New()
if err != nil {
log.Fatal(err)
}
fhs, err := sfs.Open("/wrp.html")
if err != nil {
log.Fatal(err)
}
tmpl, err = ioutil.ReadAll(fhs)
if err != nil {
log.Fatal(err)
}
log.Printf("Got UI template from built-in\n")
return string(tmpl)
}
2020-04-24 03:06:21 -07:00
// Main...
2019-05-29 01:29:01 -07:00
func main() {
2020-10-29 07:16:14 -07:00
var addr, fgeom, tHtml string
var headless bool
var debug bool
var err error
2019-05-29 01:52:28 -07:00
flag.StringVar(&addr, "l", ":8080", "Listen address:port, default :8080")
flag.BoolVar(&headless, "h", true, "Headless mode - hide browser window")
flag.BoolVar(&debug, "d", false, "Debug ChromeDP")
2020-10-31 08:51:20 -07:00
flag.BoolVar(&noDel, "n", false, "Do not free maps and images after use")
flag.StringVar(&defType, "t", "gif", "Image type: gif|png")
flag.StringVar(&fgeom, "g", "1152x600x256", "Geometry: width x height x colors, height can be 0 for unlimited")
2020-10-29 07:16:14 -07:00
flag.StringVar(&tHtml, "ui", "wrp.html", "HTML template file for the UI")
2019-05-29 01:52:28 -07:00
flag.Parse()
if len(os.Getenv("PORT")) > 0 {
addr = ":" + os.Getenv(("PORT"))
}
2020-10-31 08:51:20 -07:00
n, err := fmt.Sscanf(fgeom, "%dx%dx%d", &defGeom.w, &defGeom.h, &defGeom.c)
if err != nil || n != 3 {
log.Fatalf("Unable to parse -g geometry flag / %s", err)
}
opts := append(chromedp.DefaultExecAllocatorOptions[:],
chromedp.Flag("headless", headless),
2019-07-10 23:58:40 -07:00
chromedp.Flag("hide-scrollbars", false),
)
2019-07-16 22:29:35 -07:00
actx, acancel := chromedp.NewExecAllocator(context.Background(), opts...)
defer acancel()
if debug {
2019-06-04 01:23:46 -07:00
ctx, cancel = chromedp.NewContext(actx, chromedp.WithDebugf(log.Printf))
} else {
2019-06-04 01:23:46 -07:00
ctx, cancel = chromedp.NewContext(actx)
}
defer cancel()
2019-05-30 02:03:17 -07:00
rand.Seed(time.Now().UnixNano())
2019-07-16 22:29:35 -07:00
c := make(chan os.Signal)
signal.Notify(c, os.Interrupt, syscall.SIGTERM)
go func() {
<-c
log.Printf("Interrupt - shutting down.")
cancel()
srv.Shutdown(context.Background())
os.Exit(1)
}()
2019-05-29 01:52:28 -07:00
http.HandleFunc("/", pageServer)
2019-06-26 01:07:13 -07:00
http.HandleFunc("/map/", mapServer)
2019-05-30 02:03:17 -07:00
http.HandleFunc("/img/", imgServer)
2019-06-17 23:53:22 -07:00
http.HandleFunc("/shutdown/", haltServer)
2019-05-29 18:47:03 -07:00
http.HandleFunc("/favicon.ico", http.NotFound)
2019-06-02 16:24:46 -07:00
log.Printf("Web Rendering Proxy Version %s\n", version)
2020-04-27 12:29:18 -07:00
log.Printf("Args: %q", os.Args)
2020-10-31 08:51:20 -07:00
log.Printf("Default Img Type: %v, Geometry: %+v", defType, defGeom)
2020-10-29 07:16:14 -07:00
htmlTmpl, err = template.New("wrp.html").Parse(tmpl(tHtml))
if err != nil {
log.Fatal(err)
}
2019-05-30 23:40:43 -07:00
log.Printf("Starting WRP http server on %s\n", addr)
2019-06-17 23:53:22 -07:00
srv.Addr = addr
err = srv.ListenAndServe()
2019-06-17 23:53:22 -07:00
if err != nil {
log.Fatal(err)
}
2019-05-29 01:29:01 -07:00
}