wrp/wrp.go

310 lines
7.4 KiB
Go
Raw Normal View History

2019-05-29 18:53:05 -07:00
//
// WRP - Web Rendering Proxy
//
2024-05-23 00:34:00 -07:00
// Copyright (c) 2013-2024 Antoni Sawicki
2024-01-02 02:09:38 -08:00
// Copyright (c) 2019-2024 Google LLC
2019-05-29 18:53:05 -07:00
//
2019-05-29 01:29:01 -07:00
package main
import (
"bytes"
2019-05-29 01:52:28 -07:00
"context"
2022-03-17 02:27:34 +00:00
"embed"
2019-05-29 01:52:28 -07:00
"flag"
"fmt"
"io"
2019-05-29 01:52:28 -07:00
"log"
"net/http"
"net/url"
2019-07-16 22:29:35 -07:00
"os"
"os/signal"
2024-05-23 00:34:00 -07:00
"runtime"
2019-05-29 01:52:28 -07:00
"strconv"
"strings"
2019-07-16 22:29:35 -07:00
"syscall"
2024-06-19 23:37:44 -07:00
"text/template"
2019-05-29 01:52:28 -07:00
"time"
2019-05-29 01:29:01 -07:00
)
2024-07-03 05:24:56 -07:00
const version = "4.8.0"
var (
addr = flag.String("l", ":8080", "Listen address:port, default :8080")
headless = flag.Bool("h", true, "Headless mode / hide browser window (default true)")
noDel = flag.Bool("n", false, "Do not free maps and images after use")
defType = flag.String("t", "gif", "Image type: png|gif|jpg")
wrpMode = flag.String("m", "ismap", "WRP Mode: ismap|html")
defImgSize = flag.Int64("is", 200, "html mode default image size")
jpgQual = flag.Int("q", 75, "Jpeg image quality, default 75%") // TODO: this should be form dropdown when jpeg is selected as image type
fgeom = flag.String("g", "1152x600x216", "Geometry: width x height x colors, height can be 0 for unlimited")
htmFnam = flag.String("ui", "wrp.html", "HTML template file for the UI")
delay = flag.Duration("s", 2*time.Second, "Delay/sleep after page is rendered and before screenshot is taken")
userAgent = flag.String("ua", "", "override chrome user agent")
)
2022-12-07 23:44:09 -08:00
2019-05-29 01:29:01 -07:00
var (
srv http.Server
actx, ctx context.Context
acncl, cncl context.CancelFunc
img = make(map[string]bytes.Buffer)
ismap = make(map[string]wrpReq)
defGeom geom
htmlTmpl *template.Template
2019-05-29 01:29:01 -07:00
)
2022-11-30 02:00:53 -08:00
//go:embed *.html
2022-03-17 02:27:34 +00:00
var fs embed.FS
type geom struct {
w int64
h int64
c int64
}
2024-07-08 21:27:51 -07:00
// TODO: there is a major overlap/duplication/triplication
// between the 3 data structs, perhps we could reduce to just one?
// Data for html template
type uiData struct {
Version string
2024-07-03 05:24:56 -07:00
WrpMode string
URL string
2020-10-31 08:51:20 -07:00
BgColor string
NColors int64
Width int64
Height int64
2021-03-08 05:02:22 -08:00
Zoom float64
ImgType string
2020-10-31 08:51:20 -07:00
ImgURL string
ImgSize string
ImgWidth int
ImgHeight int
2024-07-03 05:24:56 -07:00
MaxSize int64
2020-10-31 08:51:20 -07:00
MapURL string
PageHeight string
2024-06-19 23:37:44 -07:00
TeXT string
}
// Parameters for HTML print function
2024-07-08 21:36:32 -07:00
type uiParams struct {
2020-10-31 08:51:20 -07:00
bgColor string
pageHeight string
imgSize string
imgURL string
mapURL string
imgWidth int
imgHeight int
2024-06-19 23:37:44 -07:00
text string
}
2020-04-24 03:06:21 -07:00
// WRP Request
2019-07-10 23:58:40 -07:00
type wrpReq struct {
url string // url
width int64 // width
height int64 // height
2021-03-08 05:02:22 -08:00
zoom float64 // zoom/scale
colors int64 // #colors
mouseX int64 // mouseX
mouseY int64 // mouseY
keys string // keys to send
buttons string // Fn buttons
imgType string // imgtype
2024-07-03 05:24:56 -07:00
wrpMode string // mode ismap/html
maxSize int64 // image max size for html mode
imgOpt int64
2022-11-06 01:11:49 -08:00
w http.ResponseWriter
r *http.Request
2019-06-25 17:07:43 -07:00
}
2019-06-24 00:40:34 -07:00
func (rq *wrpReq) parseForm() {
2022-11-06 01:11:49 -08:00
rq.r.ParseForm()
2024-07-03 05:24:56 -07:00
rq.wrpMode = rq.r.FormValue("m")
if rq.wrpMode == "" {
rq.wrpMode = *wrpMode
}
2022-11-06 01:11:49 -08:00
rq.url = rq.r.FormValue("url")
if len(rq.url) > 1 && !strings.HasPrefix(rq.url, "http") {
rq.url = fmt.Sprintf("http://www.google.com/search?q=%s", url.QueryEscape(rq.url))
2019-06-25 17:07:43 -07:00
}
2024-07-03 05:24:56 -07:00
// TODO: implement atoiOrZero
2022-11-06 01:11:49 -08:00
rq.width, _ = strconv.ParseInt(rq.r.FormValue("w"), 10, 64)
rq.height, _ = strconv.ParseInt(rq.r.FormValue("h"), 10, 64)
if rq.width < 10 && rq.height < 10 {
rq.width = defGeom.w
rq.height = defGeom.h
2019-05-29 01:52:28 -07:00
}
2022-11-06 01:11:49 -08:00
rq.zoom, _ = strconv.ParseFloat(rq.r.FormValue("z"), 64)
if rq.zoom < 0.1 {
rq.zoom = 1.0
2019-05-30 18:08:48 -07:00
}
2024-07-03 05:24:56 -07:00
rq.colors, _ = strconv.ParseInt(rq.r.FormValue("c"), 10, 64) // TODO: this needs to be jpeg quality as well
if rq.colors < 2 || rq.colors > 256 { // ... but maybe not because of this?
rq.colors = defGeom.c
2019-06-02 17:06:41 -07:00
}
2022-11-06 01:11:49 -08:00
rq.keys = rq.r.FormValue("k")
rq.buttons = rq.r.FormValue("Fn")
2024-07-03 05:24:56 -07:00
rq.maxSize, _ = strconv.ParseInt(rq.r.FormValue("s"), 10, 64)
if rq.maxSize == 0 {
rq.maxSize = *defImgSize
}
2022-11-06 01:11:49 -08:00
rq.imgType = rq.r.FormValue("t")
2022-12-08 00:55:56 -08:00
switch rq.imgType {
case "png":
case "gif":
2024-07-03 05:24:56 -07:00
rq.imgOpt = defGeom.c
2022-12-08 00:55:56 -08:00
case "jpg":
2024-07-03 05:24:56 -07:00
rq.imgOpt = int64(*jpgQual)
2022-12-08 00:55:56 -08:00
default:
2022-12-07 23:44:09 -08:00
rq.imgType = *defType
2024-07-03 05:24:56 -07:00
rq.imgOpt = 80 // TODO: fixme, this needs to be different based on image type
2019-11-03 16:58:38 -08:00
}
2022-11-06 01:11:49 -08:00
log.Printf("%s WrpReq from UI Form: %+v\n", rq.r.RemoteAddr, rq)
2019-06-25 17:07:43 -07:00
}
2024-07-08 21:36:32 -07:00
func (rq *wrpReq) printUI(p uiParams) {
2022-11-06 01:11:49 -08:00
rq.w.Header().Set("Cache-Control", "max-age=0")
rq.w.Header().Set("Expires", "-1")
rq.w.Header().Set("Pragma", "no-cache")
rq.w.Header().Set("Content-Type", "text/html")
if p.bgColor == "" {
p.bgColor = "#FFFFFF"
}
data := uiData{
Version: version,
2024-07-03 05:24:56 -07:00
WrpMode: rq.wrpMode,
URL: rq.url,
2020-10-31 08:51:20 -07:00
BgColor: p.bgColor,
Width: rq.width,
Height: rq.height,
2024-07-03 05:24:56 -07:00
NColors: rq.colors, // TODO: this needs to be also jpeg quality
Zoom: rq.zoom,
2024-07-03 05:24:56 -07:00
MaxSize: rq.maxSize,
ImgType: rq.imgType,
2020-10-31 08:51:20 -07:00
ImgSize: p.imgSize,
ImgWidth: p.imgWidth,
ImgHeight: p.imgHeight,
ImgURL: p.imgURL,
MapURL: p.mapURL,
PageHeight: p.pageHeight,
2024-06-19 23:37:44 -07:00
TeXT: p.text,
2019-11-03 17:53:20 -08:00
}
2022-11-06 01:11:49 -08:00
err := htmlTmpl.Execute(rq.w, data)
if err != nil {
2024-06-22 15:40:37 -07:00
fmt.Fprintf(rq.w, "Error: %v", err)
2019-11-03 16:58:38 -08:00
}
2019-06-26 01:07:13 -07:00
}
2022-11-06 01:11:49 -08:00
func pageServer(w http.ResponseWriter, r *http.Request) {
log.Printf("%s Page Request for %s [%+v]\n", r.RemoteAddr, r.URL.Path, r.URL.RawQuery)
rq := wrpReq{
2022-11-06 01:11:49 -08:00
r: r,
w: w,
}
rq.parseForm()
if len(rq.url) < 4 {
2024-07-08 21:36:32 -07:00
rq.printUI(uiParams{bgColor: "#FFFFFF"})
return
}
2022-12-08 00:28:28 -08:00
rq.navigate() // TODO: if error from navigate do not capture
2024-07-03 05:24:56 -07:00
if rq.wrpMode == "html" {
2024-06-22 19:43:53 -07:00
rq.captureMarkdown()
2024-06-19 23:37:44 -07:00
return
}
2024-07-03 05:24:56 -07:00
rq.captureScreenshot()
}
2022-11-06 01:11:49 -08:00
func haltServer(w http.ResponseWriter, r *http.Request) {
log.Printf("%s Shutdown Request for %s\n", r.RemoteAddr, r.URL.Path)
w.Header().Set("Content-Type", "text/plain")
fmt.Fprintf(w, "Shutting down WRP...\n")
w.(http.Flusher).Flush()
time.Sleep(time.Second * 2)
cncl()
acncl()
srv.Shutdown(context.Background())
os.Exit(1)
}
2024-07-08 21:36:32 -07:00
func wrpTemplate(t string) string {
2020-10-29 07:16:14 -07:00
var tmpl []byte
fh, err := os.Open(t)
if err != nil {
2022-11-06 01:12:26 -08:00
goto builtin
2020-10-29 07:16:14 -07:00
}
2022-12-07 23:50:58 -08:00
defer fh.Close()
2024-07-03 05:24:56 -07:00
tmpl, err = io.ReadAll(fh)
2020-10-29 07:16:14 -07:00
if err != nil {
2022-11-06 01:12:26 -08:00
goto builtin
2020-10-29 07:16:14 -07:00
}
2022-12-07 23:50:58 -08:00
log.Printf("Got HTML UI template from %v file, size %v \n", t, len(tmpl))
2020-10-29 07:16:14 -07:00
return string(tmpl)
2022-11-06 01:12:26 -08:00
builtin:
2022-11-30 02:00:53 -08:00
fhs, err := fs.Open("wrp.html")
2020-10-29 07:16:14 -07:00
if err != nil {
log.Fatal(err)
}
2022-12-07 23:50:58 -08:00
defer fhs.Close()
2020-10-29 07:16:14 -07:00
2024-07-03 05:24:56 -07:00
tmpl, err = io.ReadAll(fhs)
2020-10-29 07:16:14 -07:00
if err != nil {
log.Fatal(err)
}
2022-12-07 23:50:58 -08:00
log.Printf("Got HTML UI template from embed\n")
2020-10-29 07:16:14 -07:00
return string(tmpl)
}
2019-05-29 01:29:01 -07:00
func main() {
var err error
2024-05-23 00:34:00 -07:00
log.SetFlags(log.LstdFlags | log.Lshortfile)
2019-05-29 01:52:28 -07:00
flag.Parse()
2024-05-23 00:34:00 -07:00
log.Printf("Web Rendering Proxy Version %s (%v)\n", version, runtime.GOARCH)
2022-12-08 01:49:46 -08:00
log.Printf("Args: %q", os.Args)
if len(os.Getenv("PORT")) > 0 {
2022-12-07 23:44:09 -08:00
*addr = ":" + os.Getenv(("PORT"))
}
2024-07-08 21:36:32 -07:00
printMyIPs(*addr)
2022-12-07 23:44:09 -08:00
n, err := fmt.Sscanf(*fgeom, "%dx%dx%d", &defGeom.w, &defGeom.h, &defGeom.c)
if err != nil || n != 3 {
log.Fatalf("Unable to parse -g geometry flag / %s", err)
}
2024-07-03 05:24:56 -07:00
cncl, acncl = chromedpStart()
defer cncl()
2024-07-03 05:24:56 -07:00
defer acncl()
2019-07-16 22:29:35 -07:00
c := make(chan os.Signal)
signal.Notify(c, os.Interrupt, syscall.SIGTERM)
go func() {
<-c
log.Printf("Interrupt - shutting down.")
cncl()
acncl()
2019-07-16 22:29:35 -07:00
srv.Shutdown(context.Background())
os.Exit(1)
}()
2019-05-29 01:52:28 -07:00
http.HandleFunc("/", pageServer)
2019-06-26 01:07:13 -07:00
http.HandleFunc("/map/", mapServer)
2024-07-08 21:36:32 -07:00
http.HandleFunc("/img/", imgServerMap)
http.HandleFunc(imgZpfx, imgServerTxt)
2019-06-17 23:53:22 -07:00
http.HandleFunc("/shutdown/", haltServer)
2019-05-29 18:47:03 -07:00
http.HandleFunc("/favicon.ico", http.NotFound)
2022-12-07 23:44:09 -08:00
log.Printf("Default Img Type: %v, Geometry: %+v", *defType, defGeom)
2024-07-08 21:36:32 -07:00
htmlTmpl, err = template.New("wrp.html").Parse(wrpTemplate(*htmFnam))
2020-10-29 07:16:14 -07:00
if err != nil {
log.Fatal(err)
}
2022-12-08 01:49:46 -08:00
log.Print("Starting WRP http server")
2022-12-07 23:44:09 -08:00
srv.Addr = *addr
err = srv.ListenAndServe()
2019-06-17 23:53:22 -07:00
if err != nil {
log.Fatal(err)
}
2019-05-29 01:29:01 -07:00
}