ref: 545c10329eb79633bf2dad81fd32576fd486b0da
dir: /domino/domino.go/
package domino import ( "fmt" "github.com/dop251/goja" "github.com/dop251/goja_nodejs/console" "github.com/dop251/goja_nodejs/eventloop" "github.com/dop251/goja_nodejs/require" "github.com/jvatic/goja-babel" "golang.org/x/net/html" "io/ioutil" "log" "opossum" "opossum/nodes" "strconv" "strings" "time" ) var DebugDumpJS *bool type Domino struct { initialized bool loop *eventloop.EventLoop html string outputHtml string domChanged chan int } func NewDomino(html string) (d *Domino) { d = &Domino{ html: html, } return } func (d *Domino) Start() { log.Printf("Start event loop") d.loop = eventloop.NewEventLoop() d.loop.Start() log.Printf("event loop started") } func (d *Domino) Stop() { d.loop.Stop() } func IntrospectError(err error, script string) { prefix := "Line " i := strings.Index(err.Error(), prefix) if i > 0 { i += len(prefix) s := err.Error()[i:] yxStart := strings.Split(s, " ")[0] yx := strings.Split(yxStart, ":") y, _ := strconv.Atoi(yx[0]) x, _ := strconv.Atoi(yx[1]) lines := strings.Split(script, "\n") if wholeLine := lines[y-1]; len(wholeLine) > 100 { from := x - 50 to := x + 50 if from < 0 { from = 0 } if to >= len(wholeLine) { to = len(wholeLine) - 1 } log.Printf("the line: %v", wholeLine[from:to]) } else { if y > 0 && len(lines[y-1]) < 120 { log.Printf("%v: %v", y-1, lines[y-1]) } log.Printf("%v: %v", y, lines[y]) if y+1 < len(lines) && len(lines[y+1]) < 120 { log.Printf("%v: %v", y+1, lines[y+1]) } } } } func (d *Domino) Exec(script string, initial bool) (res string, err error) { if !initial && !d.initialized { initial = true } script = strings.Replace(script, "const ", "var ", -1) script = strings.Replace(script, "let ", "var ", -1) script = strings.Replace(script, "<!--", "", -1) SCRIPT := ` global = {}; //global.__domino_frozen__ = true; // Must precede any require('domino') var domino = require('domino-lib/index'); var Element = domino.impl.Element; // etc Object.assign(this, domino.createWindow(s.html, 'http://example.com')); window = this; window.parent = window; window.top = window; window.self = window; addEventListener = function() {}; window.location.href = 'http://example.com'; location = window.location; navigator = { userAgent: 'opossum' }; HTMLElement = domino.impl.HTMLElement; // Fire DOMContentLoaded to trigger $(document).ready(..) document.close(); ` + script if !initial { SCRIPT = script } if *DebugDumpJS { ioutil.WriteFile("main.js", []byte(SCRIPT), 0644) } ready := make(chan goja.Value) go func() { d.loop.RunOnLoop(func(vm *goja.Runtime) { log.Printf("RunOnLoop") if initial { registry := require.NewRegistry( require.WithGlobalFolders(".", ".."), ) console.Enable(vm) req := registry.Enable(vm) _ = req vm.SetFieldNameMapper(goja.TagFieldNameMapper("json", true)) type S struct { Buf string `json:"buf"` HTML string `json:"html"` } vm.Set("s", S{ HTML: d.html, Buf: "yolo", }) } vv, err := vm.RunString(SCRIPT) if err != nil { log.Printf("run program: %v", err) IntrospectError(err, script) } ready <- vv }) }() v := <-ready <-time.After(10 * time.Millisecond) if v != nil { res = v.String() } if err == nil { d.initialized=true } return } func (d *Domino) Exec6(script string) (res string, err error) { babel.Init(4) // Setup 4 transformers (can be any number > 0) r, err := babel.Transform(strings.NewReader(script), map[string]interface{}{ "plugins": []string{ "transform-react-jsx", "transform-es2015-block-scoping", }, }) if err != nil { return "", fmt.Errorf("babel: %v", err) } buf, err := ioutil.ReadAll(r) if err != nil { return "", fmt.Errorf("read all: %v", err) } return d.Exec(string(buf), true) } // TriggerClick, and return the result html // ...then HTML5 parse it, diff the node tree // (probably faster and cleaner than anything else) func (d *Domino) TriggerClick(selector string) (newHTML string, ok bool, err error) { res, err := d.Exec(` var sel = '` + selector + `'; var el = document.querySelector(sel); console.log('query ' + sel); if (el._listeners && el._listeners.click) { var fn = el.click.bind(el); if (fn) { console.log(' call click handler...'); fn(); } !!fn; } else { false; } `, false) if ok = res == "true"; ok { newHTML, ok, err = d.TrackChanges() } return } // Put change into html (e.g. from input field mutation) func (d *Domino) PutAttr(selector, attr, val string) (ok bool, err error) { res, err := d.Exec(` var sel = '` + selector + `'; var el = document.querySelector(sel); el.attr('` + attr + `', '` + val + `'); !!el; `, false) ok = res == "true" return } func (d *Domino) TrackChanges() (html string, changed bool, err error) { html, err = d.Exec("document.querySelector('html').innerHTML;", false) if err != nil { return } changed = d.outputHtml != html d.outputHtml = html return } func Srcs(doc *nodes.Node) (srcs []string) { srcs = make([]string, 0, 3) iterateJsElements(doc, func(src, inlineCode string) { if src = strings.TrimSpace(src); src != "" && !blocked(src) { srcs = append(srcs, src) } }) return } func blocked(src string) bool { for _, s := range []string{"adsense", "adsystem", "adservice", "googletagservice", "googletagmanager", "script.ioam.de","googlesyndication","adserver", "nativeads", "prebid", ".ads."} { if strings.Contains(src, s) { return true } } return false } func Scripts(doc *nodes.Node, downloads map[string]string) (codes []string) { codes = make([]string, 0, 3) iterateJsElements(doc, func(src, inlineCode string) { if strings.TrimSpace(inlineCode) != "" { codes = append(codes, inlineCode) } else if c, ok := downloads[src]; ok { codes = append(codes, c) } }) return } func iterateJsElements(doc *nodes.Node, fn func(src string, inlineCode string)) { var f func(n *nodes.Node) f = func(n *nodes.Node) { if n.Type() == html.ElementNode && n.Data() == "script" { isJS := true src := "" for _, a := range n.Attrs { switch strings.ToLower(a.Key) { case "type": t, err := opossum.NewContentType(a.Val, nil) if err != nil { log.Printf("t: %v", err) } if a.Val == "" || t.IsJS() { isJS = true } else { isJS = false } case "src": src = a.Val } } if isJS { fn(src, nodes.ContentFrom(*n)) } } for _, c := range n.Children { f(c) } } f(doc) return } // AJAX: // https://stackoverflow.com/questions/7086858/loading-ajax-app-with-jsdom // Babel on Goja: // https://github.com/dop251/goja/issues/5#issuecomment-259996573 // Goja supports ES5.1 which is essentially JS assembly: // https://github.com/dop251/goja/issues/76#issuecomment-399253779