URL https://opencores.org/ocsvn/openrisc/openrisc/trunk

Subversion Repositories openrisc

[/] [openrisc/] [trunk/] [gnu-dev/] [or1k-gcc/] [libgo/] [go/] [html/] [template/] [escape.go] - Blame information for rev 747

Details | Compare with Previous | View Log


// Copyright 2011 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
 
package template
 
import (
        "bytes"
        "fmt"
        "html"
        "text/template"
        "text/template/parse"
)
 
// escapeTemplates contextually escapes each of the named templates, all of
// which must belong to tmpl.  Names should list every template that may be
// Executed directly; helper templates need not be listed.
//
// On success the accumulated edits are committed and nil is returned.  On
// the first failure every named template found in tmpl.set has its parse
// tree cleared so that it cannot be executed, and the error is returned.
func escapeTemplates(tmpl *Template, names ...string) error {
        esc := newEscaper(tmpl)
        for _, name := range names {
                out, _ := esc.escapeTree(context{}, name, 0)

                var failure error
                switch {
                case out.err != nil:
                        // Attribute the error to the template being escaped.
                        out.err.Name = name
                        failure = out.err
                case out.state != stateText:
                        failure = &Error{ErrEndContext, name, 0, fmt.Sprintf("ends in a non-text context: %v", out)}
                }

                if failure == nil {
                        tmpl.escaped = true
                        continue
                }

                // Prevent execution of unsafe templates.
                for _, unsafe := range names {
                        if t := tmpl.set[unsafe]; t != nil {
                                t.text.Tree = nil
                        }
                }
                return failure
        }
        esc.commit()
        return nil
}
 
// funcMap maps command names to functions that render their inputs safe.
// The keys are the identifiers that escapeAction selects for insertion into
// action pipelines.
var funcMap = template.FuncMap{
        "exp_template_html_attrescaper":     attrEscaper,
        "exp_template_html_commentescaper":  commentEscaper,
        "exp_template_html_cssescaper":      cssEscaper,
        "exp_template_html_cssvaluefilter":  cssValueFilter,
        "exp_template_html_htmlnamefilter":  htmlNameFilter,
        "exp_template_html_htmlescaper":     htmlEscaper,
        "exp_template_html_jsregexpescaper": jsRegexpEscaper,
        "exp_template_html_jsstrescaper":    jsStrEscaper,
        "exp_template_html_jsvalescaper":    jsValEscaper,
        "exp_template_html_nospaceescaper":  htmlNospaceEscaper,
        "exp_template_html_rcdataescaper":   rcdataEscaper,
        "exp_template_html_urlescaper":      urlEscaper,
        "exp_template_html_urlfilter":       urlFilter,
        "exp_template_html_urlnormalizer":   urlNormalizer,
}
 
// equivEscapers matches contextual escapers to equivalent template builtins.
// escFnsEq maps both of its arguments through this table before comparing
// them, so a pipeline that already ends in a builtin such as "html" is
// treated as already containing the corresponding contextual escaper.
var equivEscapers = map[string]string{
        "exp_template_html_attrescaper":    "html",
        "exp_template_html_htmlescaper":    "html",
        "exp_template_html_nospaceescaper": "html",
        "exp_template_html_rcdataescaper":  "html",
        "exp_template_html_urlescaper":     "urlquery",
        "exp_template_html_urlnormalizer":  "urlquery",
}
 
// escaper collects type inferences about templates and changes needed to make
// templates injection safe.
type escaper struct {
        // tmpl is the template the escaper was created for (see newEscaper).
        tmpl *Template
        // output[mangledName] is the output context of a template whose name
        // has been mangled to include its input context.
        output map[string]context
        // derived[c.mangle(name)] maps to a template derived from the template
        // named name for the start context c.
        derived map[string]*template.Template
        // called is the set of mangled template names that have been passed to
        // escapeTree.
        called map[string]bool
        // xxxNodeEdits are the accumulated edits to apply during commit.
        // Such edits are not applied immediately in case a template set
        // executes a given template in different escaping contexts.
        actionNodeEdits   map[*parse.ActionNode][]string
        templateNodeEdits map[*parse.TemplateNode]string
        textNodeEdits     map[*parse.TextNode][]byte
}
 
// newEscaper returns an escaper bound to t whose inference tables and
// pending-edit maps are all allocated and empty.
func newEscaper(t *Template) *escaper {
        return &escaper{
                tmpl:              t,
                output:            make(map[string]context),
                derived:           make(map[string]*template.Template),
                called:            make(map[string]bool),
                actionNodeEdits:   make(map[*parse.ActionNode][]string),
                templateNodeEdits: make(map[*parse.TemplateNode]string),
                textNodeEdits:     make(map[*parse.TextNode][]byte),
        }
}
 
// filterFailsafe is an innocuous word that sanitizer functions emit in place
// of unsafe values. It is not a keyword in any programming language, contains
// no special characters, and is not empty. It is also distinctive enough that
// a developer who sees it in output can find the source of the problem via a
// search engine.
const filterFailsafe = "ZgotmplZ"
 
// escape dispatches on the concrete type of n to the matching escapeXxx
// method and returns the context that results from escaping n when starting
// in context c.  It panics for node types it does not know how to escape.
func (e *escaper) escape(c context, n parse.Node) context {
        switch node := n.(type) {
        // Leaf and container nodes.
        case *parse.ActionNode:
                return e.escapeAction(c, node)
        case *parse.ListNode:
                return e.escapeList(c, node)
        case *parse.TemplateNode:
                return e.escapeTemplate(c, node)
        case *parse.TextNode:
                return e.escapeText(c, node)

        // Branching nodes share one implementation, keyed by keyword.
        case *parse.IfNode:
                return e.escapeBranch(c, &node.BranchNode, "if")
        case *parse.RangeNode:
                return e.escapeBranch(c, &node.BranchNode, "range")
        case *parse.WithNode:
                return e.escapeBranch(c, &node.BranchNode, "with")

        default:
                panic("escaping " + n.String() + " is unimplemented")
        }
}
 
// escapeAction escapes an action template node.
//
// It nudges c past any empty-string transitions, chooses the sanitizer
// function names appropriate for the resulting context, records them as a
// pending edit for n via editActionNode, and returns the context that holds
// after the action. Actions that only declare variables are left untouched.
// An error context is returned unchanged, and an action in an ambiguous URL
// position yields a new error context.
func (e *escaper) escapeAction(c context, n *parse.ActionNode) context {
        if len(n.Pipe.Decl) != 0 {
                // A local variable assignment, not an interpolation.
                return c
        }
        c = nudge(c)
        // s accumulates sanitizer names in the order they must run.
        s := make([]string, 0, 3)
        switch c.state {
        case stateError:
                return c
        case stateURL, stateCSSDqStr, stateCSSSqStr, stateCSSDqURL, stateCSSSqURL, stateCSSURL:
                switch c.urlPart {
                case urlPartNone:
                        // Nothing of the URL has been seen yet: filter first, then
                        // fall through to apply the same escaper as the pre-query part.
                        s = append(s, "exp_template_html_urlfilter")
                        fallthrough
                case urlPartPreQuery:
                        switch c.state {
                        case stateCSSDqStr, stateCSSSqStr:
                                s = append(s, "exp_template_html_cssescaper")
                        default:
                                s = append(s, "exp_template_html_urlnormalizer")
                        }
                case urlPartQueryOrFrag:
                        s = append(s, "exp_template_html_urlescaper")
                case urlPartUnknown:
                        // The URL part could not be determined, so no single
                        // escaper is known to be correct here.
                        return context{
                                state: stateError,
                                err:   errorf(ErrAmbigContext, n.Line, "%s appears in an ambiguous URL context", n),
                        }
                default:
                        panic(c.urlPart.String())
                }
        case stateJS:
                s = append(s, "exp_template_html_jsvalescaper")
                // A slash after a value starts a div operator.
                c.jsCtx = jsCtxDivOp
        case stateJSDqStr, stateJSSqStr:
                s = append(s, "exp_template_html_jsstrescaper")
        case stateJSRegexp:
                s = append(s, "exp_template_html_jsregexpescaper")
        case stateCSS:
                s = append(s, "exp_template_html_cssvaluefilter")
        case stateText:
                s = append(s, "exp_template_html_htmlescaper")
        case stateRCDATA:
                s = append(s, "exp_template_html_rcdataescaper")
        case stateAttr:
                // Handled below in delim check.
        case stateAttrName, stateTag:
                c.state = stateAttrName
                s = append(s, "exp_template_html_htmlnamefilter")
        default:
                if isComment(c.state) {
                        s = append(s, "exp_template_html_commentescaper")
                } else {
                        panic("unexpected state " + c.state.String())
                }
        }
        // The attribute delimiter decides which additional escaper, if any, is
        // appended after the state-specific ones.
        switch c.delim {
        case delimNone:
                // No extra-escaping needed for raw text content.
        case delimSpaceOrTagEnd:
                s = append(s, "exp_template_html_nospaceescaper")
        default:
                s = append(s, "exp_template_html_attrescaper")
        }
        // Record the edit for n; the node itself is not modified here.
        e.editActionNode(n, s)
        return c
}
 
// ensurePipelineContains ensures that the pipeline has commands with
// the identifiers in s in order.
// If the pipeline already has some of the sanitizers, do not interfere.
// For example, if p is (.X | html) and s is ["escapeJSVal", "html"] then it
// has one matching, "html", and one to insert, "escapeJSVal", to produce
// (.X | escapeJSVal | html).
//
// Only the unbroken run of identifier commands at the very end of the
// pipeline is matched against s: a sanitizer that is followed by a
// non-identifier command does not sanitize the final output, so it does not
// count as already present. A pipeline that uses "noescape" as a command
// identifier anywhere is left untouched. If s is empty, p is not modified.
func ensurePipelineContains(p *parse.PipeNode, s []string) {
        if len(s) == 0 {
                return
        }
        n := len(p.Cmds)
        // Find the identifiers at the end of the command chain.
        // identStart is fixed by the first non-identifier command met while
        // walking backwards; the walk itself continues to the front only so
        // that "noescape" is still honoured wherever it appears. Letting later
        // iterations move identStart further left would pull non-identifier
        // commands into idents and make the type assertions below panic.
        identStart, sawNonIdent := 0, false
        for i := n - 1; i >= 0; i-- {
                if cmd := p.Cmds[i]; len(cmd.Args) != 0 {
                        if id, ok := cmd.Args[0].(*parse.IdentifierNode); ok {
                                if id.Ident == "noescape" {
                                        return
                                }
                                continue
                        }
                }
                if !sawNonIdent {
                        identStart, sawNonIdent = i+1, true
                }
        }
        // Every command in idents has a non-empty Args whose first element is
        // an *parse.IdentifierNode, so the assertions below cannot fail.
        idents := p.Cmds[identStart:]
        dups := 0
        for _, id := range idents {
                if escFnsEq(s[dups], (id.Args[0].(*parse.IdentifierNode)).Ident) {
                        dups++
                        if dups == len(s) {
                                // All required sanitizers are already present, in order.
                                return
                        }
                }
        }
        newCmds := make([]*parse.CommandNode, n-len(idents), n+len(s)-dups)
        copy(newCmds, p.Cmds)
        // Merge existing identifier commands with the sanitizers needed.
        for _, id := range idents {
                i := indexOfStr((id.Args[0].(*parse.IdentifierNode)).Ident, s, escFnsEq)
                if i != -1 {
                        // Insert the sanitizers that must precede this existing one.
                        for _, name := range s[:i] {
                                newCmds = appendCmd(newCmds, newIdentCmd(name))
                        }
                        s = s[i+1:]
                }
                newCmds = appendCmd(newCmds, id)
        }
        // Create any remaining sanitizers.
        for _, name := range s {
                newCmds = appendCmd(newCmds, newIdentCmd(name))
        }
        p.Cmds = newCmds
}
 
// redundantFuncs[a][b] implies that funcMap[b](funcMap[a](x)) == funcMap[a](x)
// for all x.
// appendCmd consults this table to skip appending command b when it would
// directly follow command a.
var redundantFuncs = map[string]map[string]bool{
        "exp_template_html_commentescaper": {
                "exp_template_html_attrescaper":    true,
                "exp_template_html_nospaceescaper": true,
                "exp_template_html_htmlescaper":    true,
        },
        "exp_template_html_cssescaper": {
                "exp_template_html_attrescaper": true,
        },
        "exp_template_html_jsregexpescaper": {
                "exp_template_html_attrescaper": true,
        },
        "exp_template_html_jsstrescaper": {
                "exp_template_html_attrescaper": true,
        },
        "exp_template_html_urlescaper": {
                "exp_template_html_urlnormalizer": true,
        },
}
 
// appendCmd appends the given command to the end of the command pipeline
// unless it is redundant with the last command.
//
// Redundancy is only considered when both the last command in cmds and cmd
// start with an identifier; in every other case (including commands with no
// arguments) cmd is appended unconditionally. It returns the possibly
// extended slice.
func appendCmd(cmds []*parse.CommandNode, cmd *parse.CommandNode) []*parse.CommandNode {
        if n := len(cmds); n != 0 && len(cmds[n-1].Args) != 0 && len(cmd.Args) != 0 {
                last, okLast := cmds[n-1].Args[0].(*parse.IdentifierNode)
                next, okNext := cmd.Args[0].(*parse.IdentifierNode)
                // Both assertions must succeed before either Ident is read;
                // a failed assertion leaves a nil pointer behind.
                if okLast && okNext && redundantFuncs[last.Ident][next.Ident] {
                        return cmds
                }
        }
        return append(cmds, cmd)
}
 
// indexOfStr returns the smallest index i for which eq(s, strs[i]) holds,
// or -1 when no element of strs matches. eq is always called with s as its
// first argument, and is not called again once a match has been found.
func indexOfStr(s string, strs []string, eq func(a, b string) bool) int {
        found := -1
        for i := 0; i < len(strs) && found < 0; i++ {
                if eq(s, strs[i]) {
                        found = i
                }
        }
        return found
}
 
// escFnsEq reports whether the two escaping function names are equivalent.
// Each name is first replaced by its entry in equivEscapers, if it has a
// non-empty one, and the resulting names are then compared for equality.
func escFnsEq(a, b string) bool {
        canonical := func(name string) string {
                if builtin := equivEscapers[name]; builtin != "" {
                        return builtin
                }
                return name
        }
        return canonical(a) == canonical(b)
}
 
// newIdentCmd returns a freshly allocated command node whose only argument
// is an identifier node for the given name.
func newIdentCmd(identifier string) *parse.CommandNode {
        cmd := new(parse.CommandNode)
        cmd.NodeType = parse.NodeCommand
        cmd.Args = []parse.Node{parse.NewIdentifier(identifier)}
        return cmd
}
 
// nudge returns the context that would result from following empty string
// transitions from the input context.
// For example, parsing:
//     `<a href=`
// will end in context{stateBeforeValue, attrURL}, but parsing one extra rune:
//     `<a href=x`
// will end in context{stateURL, delimSpaceOrTagEnd, ...}.
// There are two transitions that happen when the 'x' is seen:
// (1) Transition from a before-value state to a start-of-value state without
//     consuming any character.
// (2) Consume 'x' and transition past the first value character.
// In this case, nudging produces the context after (1) happens.
// Contexts in any other state are returned unchanged.
func nudge(c context) context {
        if c.state == stateTag {
                // In `<foo {{.}}`, the action should emit an attribute.
                c.state = stateAttrName
        } else if c.state == stateBeforeValue {
                // In `<foo bar={{.}}`, the action is an undelimited value.
                // Look up the start state before the attribute kind is reset.
                start := attrStartStates[c.attr]
                c.state = start
                c.delim = delimSpaceOrTagEnd
                c.attr = attrNone
        } else if c.state == stateAfterName {
                // In `<foo bar {{.}}`, the action is an attribute name.
                c.state = stateAttrName
                c.attr = attrNone
        }
        return c
}
 
// join joins the two contexts of a branch template node. The result is an
// error context if either of the input contexts is an error context, or if
// the input contexts differ in a way that cannot be reconciled.
func join(a, b context, line int, nodeName string) context {
        if a.state == stateError {
                return a
        }
        if b.state == stateError {
                return b
        }
        if a.eq(b) {
                return a
        }
 
        c := a
        c.urlPart = b.urlPart
        if c.eq(b) {
                // The contexts differ only by urlPart.
                c.urlPart = urlPartUnknown
                return c
        }
 
        c = a
        c.jsCtx = b.jsCtx
        if c.eq(b) {
                // The contexts differ only by jsCtx.
                c.jsCtx = jsCtxUnknown
                return c
        }
 
        // Allow a nudged context to join with an unnudged one.
        // This means that
        //   
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
func 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
func 
 
 
 
 
 
 
 
 
 
// 
// 
// 
// 
func 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
func 
 
 
 
 
 
 
 
// 
// 
func 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
// 
func 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
// 
// 
func 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
var 
 
 
 
 
 
 
 
 
 
 
 
 
var 
 
// 
func 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
// 
func 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
func 
 
 
 
 
 
 
// 
func 
 
 
 
 
 
 
// 
func 
 
 
 
 
 
 
// 
// 
func 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
// 
func 
 
 
 
 
 
 

powered // ends in an unquoted value state even though the else branch // ends in stateBeforeValue. if c, d := nudge(a), nudge(b); !(c.eq(a) && d.eq(b)) { if e := join(c, d, line, nodeName); e.state != stateError { return e } } return context{ state: stateError, err: errorf(ErrBranchEnd, line, "{{%s}} branches end in different contexts: %v, %v", nodeName, a, b), } } escapeBranch escapes a branch template node: "if", "range" and "with". (e *escaper) escapeBranch(c context, n *parse.BranchNode, nodeName string) context { c0 := e.escapeList(c, n.List) if nodeName == "range" && c0.state != stateError { // The "true" branch of a "range" node can execute multiple times. // We check that executing n.List once results in the same context // as executing n.List twice. c1, _ := e.escapeListConditionally(c0, n.List, nil) c0 = join(c0, c1, n.Line, nodeName) if c0.state == stateError { // Make clear that this is a problem on loop re-entry // since developers tend to overlook that branch when // debugging templates. c0.err.Line = n.Line c0.err.Description = "on range loop re-entry: " + c0.err.Description return c0 } } c1 := e.escapeList(c, n.ElseList) return join(c0, c1, n.Line, nodeName) } escapeList escapes a list template node. (e *escaper) escapeList(c context, n *parse.ListNode) context { if n == nil { return c } for _, m := range n.Nodes { c = e.escape(c, m) } return c } escapeListConditionally escapes a list node but only preserves edits and inferences in e if the inferences and output context satisfy filter. It returns the best guess at an output context, and the result of the filter which is the same as whether e was updated. (e *escaper) escapeListConditionally(c context, n *parse.ListNode, filter func(*escaper, context) bool) (context, bool) { e1 := newEscaper(e.tmpl) // Make type inferences available to f. 
for k, v := range e.output { e1.output[k] = v } c = e1.escapeList(c, n) ok := filter != nil && filter(e1, c) if ok { // Copy inferences and edits from e1 back into e. for k, v := range e1.output { e.output[k] = v } for k, v := range e1.derived { e.derived[k] = v } for k, v := range e1.called { e.called[k] = v } for k, v := range e1.actionNodeEdits { e.editActionNode(k, v) } for k, v := range e1.templateNodeEdits { e.editTemplateNode(k, v) } for k, v := range e1.textNodeEdits { e.editTextNode(k, v) } } return c, ok } escapeTemplate escapes a {{template}} call node. (e *escaper) escapeTemplate(c context, n *parse.TemplateNode) context { c, name := e.escapeTree(c, n.Name, n.Line) if name != n.Name { e.editTemplateNode(n, name) } return c } escapeTree escapes the named template starting in the given context as necessary and returns its output context. (e *escaper) escapeTree(c context, name string, line int) (context, string) { // Mangle the template name with the input context to produce a reliable // identifier. dname := c.mangle(name) e.called[dname] = true if out, ok := e.output[dname]; ok { // Already escaped. return out, dname } t := e.template(name) if t == nil { // Two cases: The template exists but is empty, or has never been mentioned at // all. Distinguish the cases in the error messages. if e.tmpl.set[name] != nil { return context{ state: stateError, err: errorf(ErrNoSuchTemplate, line, "%q is an incomplete or empty template", name), }, dname } return context{ state: stateError, err: errorf(ErrNoSuchTemplate, line, "no such template %q", name), }, dname } if dname != name { // Use any template derived during an earlier call to escapeTemplate // with different top level templates, or clone if necessary. 
dt := e.template(dname) if dt == nil { dt = template.New(dname) dt.Tree = &parse.Tree{Name: dname, Root: cloneList(t.Root)} e.derived[dname] = dt } t = dt } return e.computeOutCtx(c, t), dname } computeOutCtx takes a template and its start context and computes the output context while storing any inferences in e. (e *escaper) computeOutCtx(c context, t *template.Template) context { // Propagate context over the body. c1, ok := e.escapeTemplateBody(c, t) if !ok { // Look for a fixed point by assuming c1 as the output context. if c2, ok2 := e.escapeTemplateBody(c1, t); ok2 { c1, ok = c2, true } // Use c1 as the error context if neither assumption worked. } if !ok && c1.state != stateError { return context{ state: stateError, // TODO: Find the first node with a line in t.text.Tree.Root err: errorf(ErrOutputContext, 0, "cannot compute output context for template %s", t.Name()), } } return c1 } escapeTemplateBody escapes the given template assuming the given output context, and returns the best guess at the output context and whether the assumption was correct. (e *escaper) escapeTemplateBody(c context, t *template.Template) (context, bool) { filter := func(e1 *escaper, c1 context) bool { if c1.state == stateError { // Do not update the input escaper, e. return false } if !e1.called[t.Name()] { // If t is not recursively called, then c1 is an // accurate output context. return true } // c1 is accurate if it matches our assumed output context. return c.eq(c1) } // We need to assume an output context so that recursive template calls // take the fast path out of escapeTree instead of infinitely recursing. // Naively assuming that the input context is the same as the output // works >90% of the time. e.output[t.Name()] = c return e.escapeListConditionally(c, t.Tree.Root, filter) } delimEnds maps each delim to a string of characters that terminate it. 
delimEnds = [...]string{ delimDoubleQuote: `"`, delimSingleQuote: "'", // Determined empirically by running the below in various browsers. // var div = document.createElement("DIV"); // for (var i = 0; i < 0x10000; ++i) { // div.innerHTML = ""; // if (div.getElementsByTagName("SPAN")[0].title.indexOf("bar") < 0) // document.write("

U+" + i.toString(16)); // } delimSpaceOrTagEnd: " \t\n\f\r>", } doctypeBytes = []byte(" escapeText escapes a text template node. (e *escaper) escapeText(c context, n *parse.TextNode) context { s, written, i, b := n.Text, 0, 0, new(bytes.Buffer) for i != len(s) { c1, nread := contextAfterText(c, s[i:]) i1 := i + nread if c.state == stateText || c.state == stateRCDATA { end := i1 if c1.state != c.state { for j := end - 1; j >= i; j-- { if s[j] == '<' { end = j break } } } for j := i; j < end; j++ { if s[j] == '<' && !bytes.HasPrefix(s[j:], doctypeBytes) { b.Write(s[written:j]) b.WriteString("<") written = j + 1 } } } else if isComment(c.state) && c.delim == delimNone { switch c.state { case stateJSBlockCmt: // http://es5.github.com/#x7.4: // "Comments behave like white space and are // discarded except that, if a MultiLineComment // contains a line terminator character, then // the entire comment is considered to be a // LineTerminator for purposes of parsing by // the syntactic grammar." if bytes.IndexAny(s[written:i1], "\n\r\u2028\u2029") != -1 { b.WriteByte('\n') } else { b.WriteByte(' ') } case stateCSSBlockCmt: b.WriteByte(' ') } written = i1 } if c.state != c1.state && isComment(c1.state) && c1.delim == delimNone { // Preserve the portion between written and the comment start. cs := i1 - 2 if c1.state == stateHTMLCmt { // "

Browse

Tools

Subversion Repositories openrisc

[/] [openrisc/] [trunk/] [gnu-dev/] [or1k-gcc/] [libgo/] [go/] [html/] [template/] [escape.go] - Blame information for rev 747

Line No.	Rev	Author	Line
1	747	jeremybenn	`// Copyright 2011 The Go Authors. All rights reserved.`
2			`// Use of this source code is governed by a BSD-style`
3			`// license that can be found in the LICENSE file.`
4
5			`package template`
6
7			`import (`
8			`"bytes"`
9			`"fmt"`
10			`"html"`
11			`"text/template"`
12			`"text/template/parse"`
13			`)`
14
15			`// escapeTemplates rewrites the named templates, which must be`
16			`// associated with t, to guarantee that the output of any of the named`
17			`// templates is properly escaped. Names should include the names of`
18			`// all templates that might be Executed but need not include helper`
19			`// templates. If no error is returned, then the named templates have`
20			`// been modified. Otherwise the named templates have been rendered`
21			`// unusable.`
22			`func escapeTemplates(tmpl *Template, names ...string) error {`
23			`e := newEscaper(tmpl)`
24			`for _, name := range names {`
25			`c, _ := e.escapeTree(context{}, name, 0)`
26			`var err error`
27			`if c.err != nil {`
28			`err, c.err.Name = c.err, name`
29			`} else if c.state != stateText {`
30			`err = &Error{ErrEndContext, name, 0, fmt.Sprintf("ends in a non-text context: %v", c)}`
31			`}`
32			`if err != nil {`
33			`// Prevent execution of unsafe templates.`
34			`for _, name := range names {`
35			`if t := tmpl.set[name]; t != nil {`
36			`t.text.Tree = nil`
37			`}`
38			`}`
39			`return err`
40			`}`
41			`tmpl.escaped = true`
42			`}`
43			`e.commit()`
44			`return nil`
45			`}`
46
47			`// funcMap maps command names to functions that render their inputs safe.`
48			`var funcMap = template.FuncMap{`
49			`"exp_template_html_attrescaper": attrEscaper,`
50			`"exp_template_html_commentescaper": commentEscaper,`
51			`"exp_template_html_cssescaper": cssEscaper,`
52			`"exp_template_html_cssvaluefilter": cssValueFilter,`
53			`"exp_template_html_htmlnamefilter": htmlNameFilter,`
54			`"exp_template_html_htmlescaper": htmlEscaper,`
55			`"exp_template_html_jsregexpescaper": jsRegexpEscaper,`
56			`"exp_template_html_jsstrescaper": jsStrEscaper,`
57			`"exp_template_html_jsvalescaper": jsValEscaper,`
58			`"exp_template_html_nospaceescaper": htmlNospaceEscaper,`
59			`"exp_template_html_rcdataescaper": rcdataEscaper,`
60			`"exp_template_html_urlescaper": urlEscaper,`
61			`"exp_template_html_urlfilter": urlFilter,`
62			`"exp_template_html_urlnormalizer": urlNormalizer,`
63			`}`
64
65			`// equivEscapers matches contextual escapers to equivalent template builtins.`
66			`var equivEscapers = map[string]string{`
67			`"exp_template_html_attrescaper": "html",`
68			`"exp_template_html_htmlescaper": "html",`
69			`"exp_template_html_nospaceescaper": "html",`
70			`"exp_template_html_rcdataescaper": "html",`
71			`"exp_template_html_urlescaper": "urlquery",`
72			`"exp_template_html_urlnormalizer": "urlquery",`
73			`}`
74
75			`// escaper collects type inferences about templates and changes needed to make`
76			`// templates injection safe.`
77			`type escaper struct {`
78			`tmpl *Template`
79			`// output[templateName] is the output context for a templateName that`
80			`// has been mangled to include its input context.`
81			`output map[string]context`
82			`// derived[c.mangle(name)] maps to a template derived from the template`
83			`// named name templateName for the start context c.`
84			`derived map[string]*template.Template`
85			`// called[templateName] is a set of called mangled template names.`
86			`called map[string]bool`
87			`// xxxNodeEdits are the accumulated edits to apply during commit.`
88			`// Such edits are not applied immediately in case a template set`
89			`// executes a given template in different escaping contexts.`
90			`actionNodeEdits map[*parse.ActionNode][]string`
91			`templateNodeEdits map[*parse.TemplateNode]string`
92			`textNodeEdits map[*parse.TextNode][]byte`
93			`}`
94
95			`// newEscaper creates a blank escaper for the given set.`
96			`func newEscaper(t *Template) *escaper {`
97			`return &escaper{`
98			`t,`
99			`map[string]context{},`
100			`map[string]*template.Template{},`
101			`map[string]bool{},`
102			`map[*parse.ActionNode][]string{},`
103			`map[*parse.TemplateNode]string{},`
104			`map[*parse.TextNode][]byte{},`
105			`}`
106			`}`
107
108			`// filterFailsafe is an innocuous word that is emitted in place of unsafe values`
109			`// by sanitizer functions. It is not a keyword in any programming language,`
110			`// contains no special characters, is not empty, and when it appears in output`
111			`// it is distinct enough that a developer can find the source of the problem`
112			`// via a search engine.`
113			`const filterFailsafe = "ZgotmplZ"`
114
115			`// escape escapes a template node.`
116			`func (e *escaper) escape(c context, n parse.Node) context {`
117			`switch n := n.(type) {`
118			`case *parse.ActionNode:`
119			`return e.escapeAction(c, n)`
120			`case *parse.IfNode:`
121			`return e.escapeBranch(c, &n.BranchNode, "if")`
122			`case *parse.ListNode:`
123			`return e.escapeList(c, n)`
124			`case *parse.RangeNode:`
125			`return e.escapeBranch(c, &n.BranchNode, "range")`
126			`case *parse.TemplateNode:`
127			`return e.escapeTemplate(c, n)`
128			`case *parse.TextNode:`
129			`return e.escapeText(c, n)`
130			`case *parse.WithNode:`
131			`return e.escapeBranch(c, &n.BranchNode, "with")`
132			`}`
133			`panic("escaping " + n.String() + " is unimplemented")`
134			`}`
135
136			`// escapeAction escapes an action template node.`
137			`func (e *escaper) escapeAction(c context, n *parse.ActionNode) context {`
138			`if len(n.Pipe.Decl) != 0 {`
139			`// A local variable assignment, not an interpolation.`
140			`return c`
141			`}`
142			`c = nudge(c)`
143			`s := make([]string, 0, 3)`
144			`switch c.state {`
145			`case stateError:`
146			`return c`
147			`case stateURL, stateCSSDqStr, stateCSSSqStr, stateCSSDqURL, stateCSSSqURL, stateCSSURL:`
148			`switch c.urlPart {`
149			`case urlPartNone:`
150			`s = append(s, "exp_template_html_urlfilter")`
151			`fallthrough`
152			`case urlPartPreQuery:`
153			`switch c.state {`
154			`case stateCSSDqStr, stateCSSSqStr:`
155			`s = append(s, "exp_template_html_cssescaper")`
156			`default:`
157			`s = append(s, "exp_template_html_urlnormalizer")`
158			`}`
159			`case urlPartQueryOrFrag:`
160			`s = append(s, "exp_template_html_urlescaper")`
161			`case urlPartUnknown:`
162			`return context{`
163			`state: stateError,`
164			`err: errorf(ErrAmbigContext, n.Line, "%s appears in an ambiguous URL context", n),`
165			`}`
166			`default:`
167			`panic(c.urlPart.String())`
168			`}`
169			`case stateJS:`
170			`s = append(s, "exp_template_html_jsvalescaper")`
171			`// A slash after a value starts a div operator.`
172			`c.jsCtx = jsCtxDivOp`
173			`case stateJSDqStr, stateJSSqStr:`
174			`s = append(s, "exp_template_html_jsstrescaper")`
175			`case stateJSRegexp:`
176			`s = append(s, "exp_template_html_jsregexpescaper")`
177			`case stateCSS:`
178			`s = append(s, "exp_template_html_cssvaluefilter")`
179			`case stateText:`
180			`s = append(s, "exp_template_html_htmlescaper")`
181			`case stateRCDATA:`
182			`s = append(s, "exp_template_html_rcdataescaper")`
183			`case stateAttr:`
184			`// Handled below in delim check.`
185			`case stateAttrName, stateTag:`
186			`c.state = stateAttrName`
187			`s = append(s, "exp_template_html_htmlnamefilter")`
188			`default:`
189			`if isComment(c.state) {`
190			`s = append(s, "exp_template_html_commentescaper")`
191			`} else {`
192			`panic("unexpected state " + c.state.String())`
193			`}`
194			`}`
195			`switch c.delim {`
196			`case delimNone:`
197			`// No extra-escaping needed for raw text content.`
198			`case delimSpaceOrTagEnd:`
199			`s = append(s, "exp_template_html_nospaceescaper")`
200			`default:`
201			`s = append(s, "exp_template_html_attrescaper")`
202			`}`
203			`e.editActionNode(n, s)`
204			`return c`
205			`}`
206
207			`// ensurePipelineContains ensures that the pipeline has commands with`
208			`// the identifiers in s in order.`
209			`// If the pipeline already has some of the sanitizers, do not interfere.`
210			`// For example, if p is (.X \| html) and s is ["escapeJSVal", "html"] then it`
211			`// has one matching, "html", and one to insert, "escapeJSVal", to produce`
212			`// (.X \| escapeJSVal \| html).`
213			`func ensurePipelineContains(p *parse.PipeNode, s []string) {`
214			`if len(s) == 0 {`
215			`return`
216			`}`
217			`n := len(p.Cmds)`
218			`// Find the identifiers at the end of the command chain.`
219			`idents := p.Cmds`
220			`for i := n - 1; i >= 0; i-- {`
221			`if cmd := p.Cmds[i]; len(cmd.Args) != 0 {`
222			`if id, ok := cmd.Args[0].(*parse.IdentifierNode); ok {`
223			`if id.Ident == "noescape" {`
224			`return`
225			`}`
226			`continue`
227			`}`
228			`}`
229			`idents = p.Cmds[i+1:]`
230			`}`
231			`dups := 0`
232			`for _, id := range idents {`
233			`if escFnsEq(s[dups], (id.Args[0].(*parse.IdentifierNode)).Ident) {`
234			`dups++`
235			`if dups == len(s) {`
236			`return`
237			`}`
238			`}`
239			`}`
240			`newCmds := make([]*parse.CommandNode, n-len(idents), n+len(s)-dups)`
241			`copy(newCmds, p.Cmds)`
242			`// Merge existing identifier commands with the sanitizers needed.`
243			`for _, id := range idents {`
244			`i := indexOfStr((id.Args[0].(*parse.IdentifierNode)).Ident, s, escFnsEq)`
245			`if i != -1 {`
246			`for _, name := range s[:i] {`
247			`newCmds = appendCmd(newCmds, newIdentCmd(name))`
248			`}`
249			`s = s[i+1:]`
250			`}`
251			`newCmds = appendCmd(newCmds, id)`
252			`}`
253			`// Create any remaining sanitizers.`
254			`for _, name := range s {`
255			`newCmds = appendCmd(newCmds, newIdentCmd(name))`
256			`}`
257			`p.Cmds = newCmds`
258			`}`
259
260			`// redundantFuncs[a][b] implies that funcMap[b](funcMap[a](x)) == funcMap[a](x)`
261			`// for all x.`
262			`var redundantFuncs = map[string]map[string]bool{`
263			`"exp_template_html_commentescaper": {`
264			`"exp_template_html_attrescaper": true,`
265			`"exp_template_html_nospaceescaper": true,`
266			`"exp_template_html_htmlescaper": true,`
267			`},`
268			`"exp_template_html_cssescaper": {`
269			`"exp_template_html_attrescaper": true,`
270			`},`
271			`"exp_template_html_jsregexpescaper": {`
272			`"exp_template_html_attrescaper": true,`
273			`},`
274			`"exp_template_html_jsstrescaper": {`
275			`"exp_template_html_attrescaper": true,`
276			`},`
277			`"exp_template_html_urlescaper": {`
278			`"exp_template_html_urlnormalizer": true,`
279			`},`
280			`}`
281
282			`// appendCmd appends the given command to the end of the command pipeline`
283			`// unless it is redundant with the last command.`
284			`func appendCmd(cmds []*parse.CommandNode, cmd *parse.CommandNode) []*parse.CommandNode {`
285			`if n := len(cmds); n != 0 {`
286			`last, ok := cmds[n-1].Args[0].(*parse.IdentifierNode)`
287			`next, _ := cmd.Args[0].(*parse.IdentifierNode)`
288			`if ok && redundantFuncs[last.Ident][next.Ident] {`
289			`return cmds`
290			`}`
291			`}`
292			`return append(cmds, cmd)`
293			`}`
294
295			`// indexOfStr is the first i such that eq(s, strs[i]) or -1 if s was not found.`
296			`func indexOfStr(s string, strs []string, eq func(a, b string) bool) int {`
297			`for i, t := range strs {`
298			`if eq(s, t) {`
299			`return i`
300			`}`
301			`}`
302			`return -1`
303			`}`
304
305			`// escFnsEq returns whether the two escaping functions are equivalent.`
306			`func escFnsEq(a, b string) bool {`
307			`if e := equivEscapers[a]; e != "" {`
308			`a = e`
309			`}`
310			`if e := equivEscapers[b]; e != "" {`
311			`b = e`
312			`}`
313			`return a == b`
314			`}`
315
316			`// newIdentCmd produces a command containing a single identifier node.`
317			`func newIdentCmd(identifier string) *parse.CommandNode {`
318			`return &parse.CommandNode{`
319			`NodeType: parse.NodeCommand,`
320			`Args: []parse.Node{parse.NewIdentifier(identifier)},`
321			`}`
322			`}`
323
324			`// nudge returns the context that would result from following empty string`
325			`// transitions from the input context.`
326			`// For example, parsing:`
327			// `
328			`// will end in context{stateBeforeValue, attrURL}, but parsing one extra rune:`
329			// `
330			`// will end in context{stateURL, delimSpaceOrTagEnd, ...}.`
331			`// There are two transitions that happen when the 'x' is seen:`
332			`// (1) Transition from a before-value state to a start-of-value state without`
333			`// consuming any character.`
334			`// (2) Consume 'x' and transition past the first value character.`
335			`// In this case, nudging produces the context after (1) happens.`
336			`func nudge(c context) context {`
337			`switch c.state {`
338			`case stateTag:`
339			// In `
340			`c.state = stateAttrName`
341			`case stateBeforeValue:`
342			// In `
343			`c.state, c.delim, c.attr = attrStartStates[c.attr], delimSpaceOrTagEnd, attrNone`
344			`case stateAfterName:`
345			// In `
346			`c.state, c.attr = stateAttrName, attrNone`
347			`}`
348			`return c`
349			`}`
350
351			`// join joins the two contexts of a branch template node. The result is an`
352			`// error context if either input context is an error context, or if the`
353			`// input contexts differ in a way that cannot be reconciled.`
354			`func join(a, b context, line int, nodeName string) context {`
355			`if a.state == stateError {`
356			`return a`
357			`}`
358			`if b.state == stateError {`
359			`return b`
360			`}`
361			`if a.eq(b) {`
362			`return a`
363			`}`
364
365			`c := a`
366			`c.urlPart = b.urlPart`
367			`if c.eq(b) {`
368			`// The contexts differ only by urlPart.`
369			`c.urlPart = urlPartUnknown`
370			`return c`
371			`}`
372
373			`c = a`
374			`c.jsCtx = b.jsCtx`
375			`if c.eq(b) {`
376			`// The contexts differ only by jsCtx.`
377			`c.jsCtx = jsCtxUnknown`
378			`return c`
379			`}`
380
381			`// Allow a nudged context to join with an unnudged one.`
382			`// This means that`
383			`//`
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398			`//`
399			`func`
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420			`//`
421			`func`
422
423
424
425
426
427
428
429
430
431			`//`
432			`//`
433			`//`
434			`//`
435			`func`
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467			`//`
468			`func`
469
470
471
472
473
474
475
476			`//`
477			`//`
478			`func`
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516			`//`
517			`//`
518			`func`
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538			`//`
539			`//`
540			`//`
541			`func`
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563			`//`
564			`var`
565
566
567
568
569
570
571
572
573
574
575
576
577			`var`
578
579			`//`
580			`func`
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647			`//`
648			`//`
649			`func`
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700			`//`
701			`func`
702
703
704
705
706
707
708			`//`
709			`func`
710
711
712
713
714
715
716			`//`
717			`func`
718
719
720
721
722
723
724			`//`
725			`//`
726			`func`
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746			`//`
747			`func`
748
749
750
751
752
753