Source file src/pkg/html/template/escape.go
1
2
3
4
5 package template
6
7 import (
8 "bytes"
9 "fmt"
10 "html"
11 "io"
12 "text/template"
13 "text/template/parse"
14 )
15
16
17
18
19
20
21 func escapeTemplate(tmpl *Template, node parse.Node, name string) error {
22 c, _ := tmpl.esc.escapeTree(context{}, node, name, 0)
23 var err error
24 if c.err != nil {
25 err, c.err.Name = c.err, name
26 } else if c.state != stateText {
27 err = &Error{ErrEndContext, nil, name, 0, fmt.Sprintf("ends in a non-text context: %v", c)}
28 }
29 if err != nil {
30
31 if t := tmpl.set[name]; t != nil {
32 t.escapeErr = err
33 t.text.Tree = nil
34 t.Tree = nil
35 }
36 return err
37 }
38 tmpl.esc.commit()
39 if t := tmpl.set[name]; t != nil {
40 t.escapeErr = escapeOK
41 t.Tree = t.text.Tree
42 }
43 return nil
44 }
45
46
47
48 func evalArgs(args ...interface{}) string {
49
50 if len(args) == 1 {
51 if s, ok := args[0].(string); ok {
52 return s
53 }
54 }
55 for i, arg := range args {
56 args[i] = indirectToStringerOrError(arg)
57 }
58 return fmt.Sprint(args...)
59 }
60
61
// funcMap maps the names of the escaper and filter functions that the
// escaper inserts into pipelines to their implementations. commit installs
// it, via Funcs, on every template that has an entry in the escaper's output
// map.
var funcMap = template.FuncMap{
	"_html_template_attrescaper":     attrEscaper,
	"_html_template_commentescaper":  commentEscaper,
	"_html_template_cssescaper":      cssEscaper,
	"_html_template_cssvaluefilter":  cssValueFilter,
	"_html_template_htmlnamefilter":  htmlNameFilter,
	"_html_template_htmlescaper":     htmlEscaper,
	"_html_template_jsregexpescaper": jsRegexpEscaper,
	"_html_template_jsstrescaper":    jsStrEscaper,
	"_html_template_jsvalescaper":    jsValEscaper,
	"_html_template_nospaceescaper":  htmlNospaceEscaper,
	"_html_template_rcdataescaper":   rcdataEscaper,
	"_html_template_srcsetescaper":   srcsetFilterAndEscaper,
	"_html_template_urlescaper":      urlEscaper,
	"_html_template_urlfilter":       urlFilter,
	"_html_template_urlnormalizer":   urlNormalizer,
	// _eval_args_ is substituted by ensurePipelineContains for a predefined
	// escaper that was called with arguments.
	"_eval_args_": evalArgs,
}
80
81
82
// escaper collects the information needed to escape the templates of one
// name space, together with the edits that commit later applies to their
// parse trees.
//
// NOTE: makeEscaper initializes this struct positionally, so the field order
// must not change.
type escaper struct {
	// ns is the name space whose templates this escaper works on.
	ns *nameSpace
	// output is keyed by (possibly mangled) template name; escapeTree
	// returns the stored context as the result of calling that template.
	output map[string]context
	// derived holds the templates that escapeTree created under a mangled
	// name by copying the tree of the template they derive from.
	derived map[string]*template.Template
	// called is the set of mangled template names passed to escapeTree.
	called map[string]bool
	// The xxxNodeEdits maps accumulate the edits recorded by
	// editActionNode, editTemplateNode and editTextNode. They are applied
	// to the nodes only in commit.
	actionNodeEdits   map[*parse.ActionNode][]string
	templateNodeEdits map[*parse.TemplateNode]string
	textNodeEdits     map[*parse.TextNode][]byte
}
101
102
103 func makeEscaper(n *nameSpace) escaper {
104 return escaper{
105 n,
106 map[string]context{},
107 map[string]*template.Template{},
108 map[string]bool{},
109 map[*parse.ActionNode][]string{},
110 map[*parse.TemplateNode]string{},
111 map[*parse.TextNode][]byte{},
112 }
113 }
114
115
116
117
118
119
// filterFailsafe is a fixed placeholder word.
// NOTE(review): it is not referenced in this part of the file; presumably the
// filter functions emit it in place of values they reject — confirm against
// their definitions.
const filterFailsafe = "ZgotmplZ"
121
122
123 func (e *escaper) escape(c context, n parse.Node) context {
124 switch n := n.(type) {
125 case *parse.ActionNode:
126 return e.escapeAction(c, n)
127 case *parse.IfNode:
128 return e.escapeBranch(c, &n.BranchNode, "if")
129 case *parse.ListNode:
130 return e.escapeList(c, n)
131 case *parse.RangeNode:
132 return e.escapeBranch(c, &n.BranchNode, "range")
133 case *parse.TemplateNode:
134 return e.escapeTemplate(c, n)
135 case *parse.TextNode:
136 return e.escapeText(c, n)
137 case *parse.WithNode:
138 return e.escapeBranch(c, &n.BranchNode, "with")
139 }
140 panic("escaping " + n.String() + " is unimplemented")
141 }
142
143
// escapeAction escapes an action template node.
//
// It selects the escaper functions appropriate for the context c in which
// the action appears, records them as a pending edit for n (applied later by
// commit), and returns the context that holds after the action. A context in
// stateError is returned when the pipeline misuses a predefined escaper or
// when the action sits in an ambiguous part of a URL.
func (e *escaper) escapeAction(c context, n *parse.ActionNode) context {
	if len(n.Pipe.Decl) != 0 {
		// The pipeline declares variables; it is not escaped and the
		// context is left unchanged.
		return c
	}
	c = nudge(c)
	// Check for disallowed uses of predefined escapers in the pipeline.
	for pos, idNode := range n.Pipe.Cmds {
		node, ok := idNode.Args[0].(*parse.IdentifierNode)
		if !ok {
			// Only commands whose first argument is a plain identifier
			// are inspected; every other command is skipped.
			continue
		}
		ident := node.Ident
		if _, ok := predefinedEscapers[ident]; ok {
			// A predefined escaper is rejected unless it is the last
			// command of the pipeline, and "html" is additionally
			// rejected inside an unquoted attribute value.
			if pos < len(n.Pipe.Cmds)-1 ||
				c.state == stateAttr && c.delim == delimSpaceOrTagEnd && ident == "html" {
				return context{
					state: stateError,
					err:   errorf(ErrPredefinedEscaper, n, n.Line, "predefined escaper %q disallowed in template", ident),
				}
			}
		}
	}
	// s collects, in order, the names of the escapers to add to the pipeline.
	s := make([]string, 0, 3)
	switch c.state {
	case stateError:
		return c
	case stateURL, stateCSSDqStr, stateCSSSqStr, stateCSSDqURL, stateCSSSqURL, stateCSSURL:
		switch c.urlPart {
		case urlPartNone:
			// Nothing of the URL has been seen yet: filter it first, then
			// fall through to the same handling as urlPartPreQuery.
			s = append(s, "_html_template_urlfilter")
			fallthrough
		case urlPartPreQuery:
			switch c.state {
			case stateCSSDqStr, stateCSSSqStr:
				s = append(s, "_html_template_cssescaper")
			default:
				s = append(s, "_html_template_urlnormalizer")
			}
		case urlPartQueryOrFrag:
			s = append(s, "_html_template_urlescaper")
		case urlPartUnknown:
			return context{
				state: stateError,
				err:   errorf(ErrAmbigContext, n, n.Line, "%s appears in an ambiguous context within a URL", n),
			}
		default:
			panic(c.urlPart.String())
		}
	case stateJS:
		s = append(s, "_html_template_jsvalescaper")
		// After an interpolated value the JS context is set to jsCtxDivOp
		// (presumably: a following '/' is a division operator, not the
		// start of a regexp).
		c.jsCtx = jsCtxDivOp
	case stateJSDqStr, stateJSSqStr:
		s = append(s, "_html_template_jsstrescaper")
	case stateJSRegexp:
		s = append(s, "_html_template_jsregexpescaper")
	case stateCSS:
		s = append(s, "_html_template_cssvaluefilter")
	case stateText:
		s = append(s, "_html_template_htmlescaper")
	case stateRCDATA:
		s = append(s, "_html_template_rcdataescaper")
	case stateAttr:
		// No state-specific escaper; the delimiter switch below adds one
		// when the attribute value is delimited.
	case stateAttrName, stateTag:
		c.state = stateAttrName
		s = append(s, "_html_template_htmlnamefilter")
	case stateSrcset:
		s = append(s, "_html_template_srcsetescaper")
	default:
		if isComment(c.state) {
			s = append(s, "_html_template_commentescaper")
		} else {
			panic("unexpected state " + c.state.String())
		}
	}
	// Add the escaper required by the attribute delimiter, if any.
	switch c.delim {
	case delimNone:
		// Not inside a delimited attribute value: nothing to add.
	case delimSpaceOrTagEnd:
		s = append(s, "_html_template_nospaceescaper")
	default:
		s = append(s, "_html_template_attrescaper")
	}
	e.editActionNode(n, s)
	return c
}
239
240
241
242
// ensurePipelineContains rewrites the pipeline p so that it ends with the
// commands named in s, in order. If the pipeline already ends with a
// predefined escaper ("html" or "urlquery"), that escaper is merged with the
// equivalent entries of s instead of being applied twice. Entries of s may
// be overwritten in the process.
func ensurePipelineContains(p *parse.PipeNode, s []string) {
	if len(s) == 0 {
		// Nothing to insert: leave the pipeline untouched.
		return
	}
	// Only the last command is examined for a predefined escaper;
	// escapeAction rejects pipelines that use one anywhere else.
	pipelineLen := len(p.Cmds)
	if pipelineLen > 0 {
		lastCmd := p.Cmds[pipelineLen-1]
		if idNode, ok := lastCmd.Args[0].(*parse.IdentifierNode); ok {
			if esc := idNode.Ident; predefinedEscapers[esc] {
				// The pipeline ends with a predefined escaper.
				if len(p.Cmds) == 1 && len(lastCmd.Args) > 1 {
					// The whole pipeline is a single call of the form
					//     {{ esc arg1 ... argN }}
					// Turn it into
					//     {{ _eval_args_ arg1 ... argN | esc }}
					// so that esc is a separate, argument-less last
					// command that can be merged with s below.
					lastCmd.Args[0] = parse.NewIdentifier("_eval_args_").SetTree(nil).SetPos(lastCmd.Args[0].Position())
					p.Cmds = appendCmd(p.Cmds, newIdentCmd(esc, p.Position()))
					pipelineLen++
				}
				// Replace every entry of s that is equivalent to the
				// predefined escaper with the predefined escaper itself.
				dup := false
				for i, escaper := range s {
					if escFnsEq(esc, escaper) {
						s[i] = idNode.Ident
						dup = true
					}
				}
				if dup {
					// The predefined escaper is now part of s, so the
					// original last command is not copied over below.
					pipelineLen--
				}
			}
		}
	}
	// Copy the retained commands, remembering the (normalized) identifiers
	// that are already present.
	newCmds := make([]*parse.CommandNode, pipelineLen, pipelineLen+len(s))
	insertedIdents := make(map[string]bool)
	for i := 0; i < pipelineLen; i++ {
		cmd := p.Cmds[i]
		newCmds[i] = cmd
		if idNode, ok := cmd.Args[0].(*parse.IdentifierNode); ok {
			insertedIdents[normalizeEscFn(idNode.Ident)] = true
		}
	}
	for _, name := range s {
		if !insertedIdents[normalizeEscFn(name)] {
			// Skip escapers that the pipeline already contains under an
			// equivalent name (presumably so that a tree which has been
			// escaped before does not receive them a second time).
			newCmds = appendCmd(newCmds, newIdentCmd(name, p.Position()))
		}
	}
	p.Cmds = newCmds
}
305
306
307
// predefinedEscapers is the set of escaper function names that template
// authors may write in a pipeline themselves. escapeAction restricts where
// they may appear and ensurePipelineContains merges them with the escapers
// it inserts.
var predefinedEscapers = map[string]bool{
	"html":     true,
	"urlquery": true,
}
312
313
314
// equivEscapers maps the name of a contextual escaper to the predefined
// escaper that normalizeEscFn treats as equivalent to it.
var equivEscapers = map[string]string{
	// Escapers normalized to the predefined "html" escaper.
	"_html_template_attrescaper":   "html",
	"_html_template_htmlescaper":   "html",
	"_html_template_rcdataescaper": "html",
	// Escapers normalized to the predefined "urlquery" escaper.
	"_html_template_urlescaper":    "urlquery",
	"_html_template_urlnormalizer": "urlquery",
}
333
334
335 func escFnsEq(a, b string) bool {
336 return normalizeEscFn(a) == normalizeEscFn(b)
337 }
338
339
340
341 func normalizeEscFn(e string) string {
342 if norm := equivEscapers[e]; norm != "" {
343 return norm
344 }
345 return e
346 }
347
348
349
// redundantFuncs[a][b] reports that appendCmd must not append escaper b
// directly after escaper a.
// NOTE(review): presumably because applying b to the output of a changes
// nothing — confirm against the escaper implementations.
var redundantFuncs = map[string]map[string]bool{
	"_html_template_commentescaper": {
		"_html_template_attrescaper":    true,
		"_html_template_nospaceescaper": true,
		"_html_template_htmlescaper":    true,
	},
	"_html_template_cssescaper": {
		"_html_template_attrescaper": true,
	},
	"_html_template_jsregexpescaper": {
		"_html_template_attrescaper": true,
	},
	"_html_template_jsstrescaper": {
		"_html_template_attrescaper": true,
	},
	"_html_template_urlescaper": {
		"_html_template_urlnormalizer": true,
	},
}
369
370
371
372 func appendCmd(cmds []*parse.CommandNode, cmd *parse.CommandNode) []*parse.CommandNode {
373 if n := len(cmds); n != 0 {
374 last, okLast := cmds[n-1].Args[0].(*parse.IdentifierNode)
375 next, okNext := cmd.Args[0].(*parse.IdentifierNode)
376 if okLast && okNext && redundantFuncs[last.Ident][next.Ident] {
377 return cmds
378 }
379 }
380 return append(cmds, cmd)
381 }
382
383
// newIdentCmd returns a command node whose only argument is an identifier
// node named identifier, positioned at pos and attached to no tree.
func newIdentCmd(identifier string, pos parse.Pos) *parse.CommandNode {
	ident := parse.NewIdentifier(identifier).SetTree(nil).SetPos(pos)
	cmd := &parse.CommandNode{NodeType: parse.NodeCommand}
	cmd.Args = []parse.Node{ident}
	return cmd
}
390
391
392
393
394
395
396
397
398
399
400
401
402
403 func nudge(c context) context {
404 switch c.state {
405 case stateTag:
406
407 c.state = stateAttrName
408 case stateBeforeValue:
409
410 c.state, c.delim, c.attr = attrStartStates[c.attr], delimSpaceOrTagEnd, attrNone
411 case stateAfterName:
412
413 c.state, c.attr = stateAttrName, attrNone
414 }
415 return c
416 }
417
418
419
420
// join combines the contexts a and b reached at the end of two branches into
// a single context. If either is an error context it is returned (a takes
// precedence). If the two cannot be reconciled, the result is an error
// context whose message names nodeName and both contexts.
func join(a, b context, node parse.Node, nodeName string) context {
	if a.state == stateError {
		return a
	}
	if b.state == stateError {
		return b
	}
	if a.eq(b) {
		return a
	}

	c := a
	c.urlPart = b.urlPart
	if c.eq(b) {
		// The contexts differ only in urlPart: keep the rest and mark the
		// URL part as unknown.
		c.urlPart = urlPartUnknown
		return c
	}

	c = a
	c.jsCtx = b.jsCtx
	if c.eq(b) {
		// The contexts differ only in jsCtx: keep the rest and mark the JS
		// context as unknown.
		c.jsCtx = jsCtxUnknown
		return c
	}

	// Retry with both contexts nudged, but only if nudging changed at least
	// one of them; this also guarantees that the recursion terminates. If
	// the retry fails as well, fall through so that the error reports the
	// original contexts a and b.
	if c, d := nudge(a), nudge(b); !(c.eq(a) && d.eq(b)) {
		if e := join(c, d, node, nodeName); e.state != stateError {
			return e
		}
	}

	return context{
		state: stateError,
		err:   errorf(ErrBranchEnd, node, 0, "{{%s}} branches end in different contexts: %v, %v", nodeName, a, b),
	}
}
464
465
466 func (e *escaper) escapeBranch(c context, n *parse.BranchNode, nodeName string) context {
467 c0 := e.escapeList(c, n.List)
468 if nodeName == "range" && c0.state != stateError {
469
470
471
472 c1, _ := e.escapeListConditionally(c0, n.List, nil)
473 c0 = join(c0, c1, n, nodeName)
474 if c0.state == stateError {
475
476
477
478 c0.err.Line = n.Line
479 c0.err.Description = "on range loop re-entry: " + c0.err.Description
480 return c0
481 }
482 }
483 c1 := e.escapeList(c, n.ElseList)
484 return join(c0, c1, n, nodeName)
485 }
486
487
488 func (e *escaper) escapeList(c context, n *parse.ListNode) context {
489 if n == nil {
490 return c
491 }
492 for _, m := range n.Nodes {
493 c = e.escape(c, m)
494 }
495 return c
496 }
497
498
499
500
501
502 func (e *escaper) escapeListConditionally(c context, n *parse.ListNode, filter func(*escaper, context) bool) (context, bool) {
503 e1 := makeEscaper(e.ns)
504
505 for k, v := range e.output {
506 e1.output[k] = v
507 }
508 c = e1.escapeList(c, n)
509 ok := filter != nil && filter(&e1, c)
510 if ok {
511
512 for k, v := range e1.output {
513 e.output[k] = v
514 }
515 for k, v := range e1.derived {
516 e.derived[k] = v
517 }
518 for k, v := range e1.called {
519 e.called[k] = v
520 }
521 for k, v := range e1.actionNodeEdits {
522 e.editActionNode(k, v)
523 }
524 for k, v := range e1.templateNodeEdits {
525 e.editTemplateNode(k, v)
526 }
527 for k, v := range e1.textNodeEdits {
528 e.editTextNode(k, v)
529 }
530 }
531 return c, ok
532 }
533
534
535 func (e *escaper) escapeTemplate(c context, n *parse.TemplateNode) context {
536 c, name := e.escapeTree(c, n, n.Name, n.Line)
537 if name != n.Name {
538 e.editTemplateNode(n, name)
539 }
540 return c
541 }
542
543
544
545 func (e *escaper) escapeTree(c context, node parse.Node, name string, line int) (context, string) {
546
547
548 dname := c.mangle(name)
549 e.called[dname] = true
550 if out, ok := e.output[dname]; ok {
551
552 return out, dname
553 }
554 t := e.template(name)
555 if t == nil {
556
557
558 if e.ns.set[name] != nil {
559 return context{
560 state: stateError,
561 err: errorf(ErrNoSuchTemplate, node, line, "%q is an incomplete or empty template", name),
562 }, dname
563 }
564 return context{
565 state: stateError,
566 err: errorf(ErrNoSuchTemplate, node, line, "no such template %q", name),
567 }, dname
568 }
569 if dname != name {
570
571
572 dt := e.template(dname)
573 if dt == nil {
574 dt = template.New(dname)
575 dt.Tree = &parse.Tree{Name: dname, Root: t.Root.CopyList()}
576 e.derived[dname] = dt
577 }
578 t = dt
579 }
580 return e.computeOutCtx(c, t), dname
581 }
582
583
584
585 func (e *escaper) computeOutCtx(c context, t *template.Template) context {
586
587 c1, ok := e.escapeTemplateBody(c, t)
588 if !ok {
589
590 if c2, ok2 := e.escapeTemplateBody(c1, t); ok2 {
591 c1, ok = c2, true
592 }
593
594 }
595 if !ok && c1.state != stateError {
596 return context{
597 state: stateError,
598 err: errorf(ErrOutputContext, t.Tree.Root, 0, "cannot compute output context for template %s", t.Name()),
599 }
600 }
601 return c1
602 }
603
604
605
606
607 func (e *escaper) escapeTemplateBody(c context, t *template.Template) (context, bool) {
608 filter := func(e1 *escaper, c1 context) bool {
609 if c1.state == stateError {
610
611 return false
612 }
613 if !e1.called[t.Name()] {
614
615
616 return true
617 }
618
619 return c.eq(c1)
620 }
621
622
623
624
625 e.output[t.Name()] = c
626 return e.escapeListConditionally(c, t.Tree.Root, filter)
627 }
628
629
// delimEnds is indexed by attribute delimiter and holds the set of bytes
// that end an attribute value using that delimiter. contextAfterText passes
// the entry to bytes.IndexAny to find the end of the value.
var delimEnds = [...]string{
	delimDoubleQuote: `"`,
	delimSingleQuote: "'",
	// An unquoted value ends at the first of these whitespace bytes or at
	// the '>' that closes the tag.
	delimSpaceOrTagEnd: " \t\n\f\r>",
}
642
// doctypeBytes is the upper-case prefix of a DOCTYPE declaration. escapeText
// compares it against upper-cased text so that the '<' that starts a DOCTYPE
// is not escaped.
var doctypeBytes = []byte("<!DOCTYPE")
644
645
646 func (e *escaper) escapeText(c context, n *parse.TextNode) context {
647 s, written, i, b := n.Text, 0, 0, new(bytes.Buffer)
648 for i != len(s) {
649 c1, nread := contextAfterText(c, s[i:])
650 i1 := i + nread
651 if c.state == stateText || c.state == stateRCDATA {
652 end := i1
653 if c1.state != c.state {
654 for j := end - 1; j >= i; j-- {
655 if s[j] == '<' {
656 end = j
657 break
658 }
659 }
660 }
661 for j := i; j < end; j++ {
662 if s[j] == '<' && !bytes.HasPrefix(bytes.ToUpper(s[j:]), doctypeBytes) {
663 b.Write(s[written:j])
664 b.WriteString("<")
665 written = j + 1
666 }
667 }
668 } else if isComment(c.state) && c.delim == delimNone {
669 switch c.state {
670 case stateJSBlockCmt:
671
672
673
674
675
676
677
678 if bytes.ContainsAny(s[written:i1], "\n\r\u2028\u2029") {
679 b.WriteByte('\n')
680 } else {
681 b.WriteByte(' ')
682 }
683 case stateCSSBlockCmt:
684 b.WriteByte(' ')
685 }
686 written = i1
687 }
688 if c.state != c1.state && isComment(c1.state) && c1.delim == delimNone {
689
690 cs := i1 - 2
691 if c1.state == stateHTMLCmt {
692
693 cs -= 2
694 }
695 b.Write(s[written:cs])
696 written = i1
697 }
698 if i == i1 && c.state == c1.state {
699 panic(fmt.Sprintf("infinite loop from %v to %v on %q..%q", c, c1, s[:i], s[i:]))
700 }
701 c, i = c1, i1
702 }
703
704 if written != 0 && c.state != stateError {
705 if !isComment(c.state) || c.delim != delimNone {
706 b.Write(n.Text[written:])
707 }
708 e.editTextNode(n, b.Bytes())
709 }
710 return c
711 }
712
713
714
// contextAfterText starts in context c, consumes a prefix of s, and returns
// the context after that prefix together with the number of bytes consumed.
func contextAfterText(c context, s []byte) (context, int) {
	if c.delim == delimNone {
		// Not inside an attribute value.
		c1, i := tSpecialTagEnd(c, s)
		if i == 0 {
			// tSpecialTagEnd reports nothing left to consume before the
			// end tag: continue from the context it returned.
			return c1, 0
		}
		// Run the transition function for the current state over the
		// content up to index i only.
		return transitionFunc[c.state](c, s[:i])
	}

	// Inside an attribute value: find where the value ends.
	i := bytes.IndexAny(s, delimEnds[c.delim])
	if i == -1 {
		i = len(s)
	}
	if c.delim == delimSpaceOrTagEnd {
		// In an unquoted attribute value the bytes below are treated as
		// errors (presumably because HTML parsers disagree on how to
		// handle them).
		if j := bytes.IndexAny(s[:i], "\"'<=`"); j >= 0 {
			return context{
				state: stateError,
				err:   errorf(ErrBadHTML, nil, 0, "%q in unquoted attr: %q", s[j:j+1], s[:i]),
			}, len(s)
		}
	}
	if i == len(s) {
		// The value does not end within s, so we remain inside the
		// attribute. Decode HTML entities first, then run the transition
		// function repeatedly over the decoded value.
		for u := []byte(html.UnescapeString(string(s))); len(u) != 0; {
			c1, i1 := transitionFunc[c.state](c, u)
			c, u = c1, u[i1:]
		}
		return c, len(s)
	}

	element := c.element

	// A "type" attribute on a script element whose value is not a JS type
	// resets the element to elementNone.
	if c.state == stateAttr && c.element == elementScript && c.attr == attrScriptType && !isJSType(string(s[:i])) {
		element = elementNone
	}

	if c.delim != delimSpaceOrTagEnd {
		// Consume the closing quote as well.
		i++
	}
	// Leaving the attribute: only the element is carried over into the new
	// tag-state context.
	return context{state: stateTag, element: element}, i
}
775
776
777 func (e *escaper) editActionNode(n *parse.ActionNode, cmds []string) {
778 if _, ok := e.actionNodeEdits[n]; ok {
779 panic(fmt.Sprintf("node %s shared between templates", n))
780 }
781 e.actionNodeEdits[n] = cmds
782 }
783
784
785 func (e *escaper) editTemplateNode(n *parse.TemplateNode, callee string) {
786 if _, ok := e.templateNodeEdits[n]; ok {
787 panic(fmt.Sprintf("node %s shared between templates", n))
788 }
789 e.templateNodeEdits[n] = callee
790 }
791
792
793 func (e *escaper) editTextNode(n *parse.TextNode, text []byte) {
794 if _, ok := e.textNodeEdits[n]; ok {
795 panic(fmt.Sprintf("node %s shared between templates", n))
796 }
797 e.textNodeEdits[n] = text
798 }
799
800
801
802 func (e *escaper) commit() {
803 for name := range e.output {
804 e.template(name).Funcs(funcMap)
805 }
806
807
808 tmpl := e.arbitraryTemplate()
809 for _, t := range e.derived {
810 if _, err := tmpl.text.AddParseTree(t.Name(), t.Tree); err != nil {
811 panic("error adding derived template")
812 }
813 }
814 for n, s := range e.actionNodeEdits {
815 ensurePipelineContains(n.Pipe, s)
816 }
817 for n, name := range e.templateNodeEdits {
818 n.Name = name
819 }
820 for n, s := range e.textNodeEdits {
821 n.Text = s
822 }
823
824
825 e.called = make(map[string]bool)
826 e.actionNodeEdits = make(map[*parse.ActionNode][]string)
827 e.templateNodeEdits = make(map[*parse.TemplateNode]string)
828 e.textNodeEdits = make(map[*parse.TextNode][]byte)
829 }
830
831
832 func (e *escaper) template(name string) *template.Template {
833
834
835 t := e.arbitraryTemplate().text.Lookup(name)
836 if t == nil {
837 t = e.derived[name]
838 }
839 return t
840 }
841
842
843
844 func (e *escaper) arbitraryTemplate() *Template {
845 for _, t := range e.ns.set {
846 return t
847 }
848 panic("no templates in name space")
849 }
850
851
852
853
854
// HTMLEscape writes to w the escaped HTML equivalent of the plain text data
// b. It delegates to text/template's HTMLEscape.
func HTMLEscape(w io.Writer, b []byte) {
	template.HTMLEscape(w, b)
}
858
859
// HTMLEscapeString returns the escaped HTML equivalent of the plain text
// data s. It delegates to text/template's HTMLEscapeString.
func HTMLEscapeString(s string) string {
	escaped := template.HTMLEscapeString(s)
	return escaped
}
863
864
865
// HTMLEscaper returns the escaped HTML equivalent of the textual
// representation of its arguments. It delegates to text/template's
// HTMLEscaper.
func HTMLEscaper(args ...interface{}) string {
	escaped := template.HTMLEscaper(args...)
	return escaped
}
869
870
// JSEscape writes to w the escaped JavaScript equivalent of the plain text
// data b. It delegates to text/template's JSEscape.
func JSEscape(w io.Writer, b []byte) {
	template.JSEscape(w, b)
}
874
875
// JSEscapeString returns the escaped JavaScript equivalent of the plain text
// data s. It delegates to text/template's JSEscapeString.
func JSEscapeString(s string) string {
	escaped := template.JSEscapeString(s)
	return escaped
}
879
880
881
// JSEscaper returns the escaped JavaScript equivalent of the textual
// representation of its arguments. It delegates to text/template's
// JSEscaper.
func JSEscaper(args ...interface{}) string {
	escaped := template.JSEscaper(args...)
	return escaped
}
885
886
887
// URLQueryEscaper returns the escaped value of the textual representation of
// its arguments in a form suitable for embedding in a URL query. It
// delegates to text/template's URLQueryEscaper.
func URLQueryEscaper(args ...interface{}) string {
	escaped := template.URLQueryEscaper(args...)
	return escaped
}
891
View as plain text