compile.go 5.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224
  1. // Copyright (C) 2016 Kohei YOSHIDA. All rights reserved.
  2. //
  3. // This program is free software; you can redistribute it and/or
  4. // modify it under the terms of The BSD 3-Clause License
  5. // that can be found in the LICENSE file.
  6. package uritemplate
  7. import (
  8. "fmt"
  9. "unicode/utf8"
  10. )
  11. type compiler struct {
  12. prog *prog
  13. }
  14. func (c *compiler) init() {
  15. c.prog = &prog{}
  16. }
  17. func (c *compiler) op(opcode progOpcode) uint32 {
  18. i := len(c.prog.op)
  19. c.prog.op = append(c.prog.op, progOp{code: opcode})
  20. return uint32(i)
  21. }
  22. func (c *compiler) opWithRune(opcode progOpcode, r rune) uint32 {
  23. addr := c.op(opcode)
  24. (&c.prog.op[addr]).r = r
  25. return addr
  26. }
  27. func (c *compiler) opWithRuneClass(opcode progOpcode, rc runeClass) uint32 {
  28. addr := c.op(opcode)
  29. (&c.prog.op[addr]).rc = rc
  30. return addr
  31. }
  32. func (c *compiler) opWithAddr(opcode progOpcode, absaddr uint32) uint32 {
  33. addr := c.op(opcode)
  34. (&c.prog.op[addr]).i = absaddr
  35. return addr
  36. }
  37. func (c *compiler) opWithAddrDelta(opcode progOpcode, delta uint32) uint32 {
  38. return c.opWithAddr(opcode, uint32(len(c.prog.op))+delta)
  39. }
  40. func (c *compiler) opWithName(opcode progOpcode, name string) uint32 {
  41. addr := c.op(opcode)
  42. (&c.prog.op[addr]).name = name
  43. return addr
  44. }
  45. func (c *compiler) compileString(str string) {
  46. for i := 0; i < len(str); {
  47. // NOTE(yosida95): It is confirmed at parse time that literals
  48. // consist of only valid-UTF8 runes.
  49. r, size := utf8.DecodeRuneInString(str[i:])
  50. c.opWithRune(opRune, r)
  51. i += size
  52. }
  53. }
  54. func (c *compiler) compileRuneClass(rc runeClass, maxlen int) {
  55. for i := 0; i < maxlen; i++ {
  56. if i > 0 {
  57. c.opWithAddrDelta(opSplit, 7)
  58. }
  59. c.opWithAddrDelta(opSplit, 3) // raw rune or pct-encoded
  60. c.opWithRuneClass(opRuneClass, rc) // raw rune
  61. c.opWithAddrDelta(opJmp, 4) //
  62. c.opWithRune(opRune, '%') // pct-encoded
  63. c.opWithRuneClass(opRuneClass, runeClassPctE) //
  64. c.opWithRuneClass(opRuneClass, runeClassPctE) //
  65. }
  66. }
  67. func (c *compiler) compileRuneClassInfinite(rc runeClass) {
  68. start := c.opWithAddrDelta(opSplit, 3) // raw rune or pct-encoded
  69. c.opWithRuneClass(opRuneClass, rc) // raw rune
  70. c.opWithAddrDelta(opJmp, 4) //
  71. c.opWithRune(opRune, '%') // pct-encoded
  72. c.opWithRuneClass(opRuneClass, runeClassPctE) //
  73. c.opWithRuneClass(opRuneClass, runeClassPctE) //
  74. c.opWithAddrDelta(opSplit, 2) // loop
  75. c.opWithAddr(opJmp, start) //
  76. }
  77. func (c *compiler) compileVarspecValue(spec varspec, expr *expression) {
  78. var specname string
  79. if spec.maxlen > 0 {
  80. specname = fmt.Sprintf("%s:%d", spec.name, spec.maxlen)
  81. } else {
  82. specname = spec.name
  83. }
  84. c.prog.numCap++
  85. c.opWithName(opCapStart, specname)
  86. split := c.op(opSplit)
  87. if spec.maxlen > 0 {
  88. c.compileRuneClass(expr.allow, spec.maxlen)
  89. } else {
  90. c.compileRuneClassInfinite(expr.allow)
  91. }
  92. capEnd := c.opWithName(opCapEnd, specname)
  93. c.prog.op[split].i = capEnd
  94. }
  95. func (c *compiler) compileVarspec(spec varspec, expr *expression) {
  96. switch {
  97. case expr.named && spec.explode:
  98. split1 := c.op(opSplit)
  99. noop := c.op(opNoop)
  100. c.compileString(spec.name)
  101. split2 := c.op(opSplit)
  102. c.opWithRune(opRune, '=')
  103. c.compileVarspecValue(spec, expr)
  104. split3 := c.op(opSplit)
  105. c.compileString(expr.sep)
  106. c.opWithAddr(opJmp, noop)
  107. c.prog.op[split2].i = uint32(len(c.prog.op))
  108. c.compileString(expr.ifemp)
  109. c.opWithAddr(opJmp, split3)
  110. c.prog.op[split1].i = uint32(len(c.prog.op))
  111. c.prog.op[split3].i = uint32(len(c.prog.op))
  112. case expr.named && !spec.explode:
  113. c.compileString(spec.name)
  114. split2 := c.op(opSplit)
  115. c.opWithRune(opRune, '=')
  116. split3 := c.op(opSplit)
  117. split4 := c.op(opSplit)
  118. c.compileVarspecValue(spec, expr)
  119. split5 := c.op(opSplit)
  120. c.prog.op[split4].i = split5
  121. c.compileString(",")
  122. c.opWithAddr(opJmp, split4)
  123. c.prog.op[split3].i = uint32(len(c.prog.op))
  124. c.compileString(",")
  125. jmp1 := c.op(opJmp)
  126. c.prog.op[split2].i = uint32(len(c.prog.op))
  127. c.compileString(expr.ifemp)
  128. c.prog.op[split5].i = uint32(len(c.prog.op))
  129. c.prog.op[jmp1].i = uint32(len(c.prog.op))
  130. case !expr.named:
  131. start := uint32(len(c.prog.op))
  132. c.compileVarspecValue(spec, expr)
  133. split1 := c.op(opSplit)
  134. jmp := c.op(opJmp)
  135. c.prog.op[split1].i = uint32(len(c.prog.op))
  136. if spec.explode {
  137. c.compileString(expr.sep)
  138. } else {
  139. c.opWithRune(opRune, ',')
  140. }
  141. c.opWithAddr(opJmp, start)
  142. c.prog.op[jmp].i = uint32(len(c.prog.op))
  143. }
  144. }
  145. func (c *compiler) compileExpression(expr *expression) {
  146. if len(expr.vars) < 1 {
  147. return
  148. }
  149. split1 := c.op(opSplit)
  150. c.compileString(expr.first)
  151. for i, size := 0, len(expr.vars); i < size; i++ {
  152. spec := expr.vars[i]
  153. split2 := c.op(opSplit)
  154. if i > 0 {
  155. split3 := c.op(opSplit)
  156. c.compileString(expr.sep)
  157. c.prog.op[split3].i = uint32(len(c.prog.op))
  158. }
  159. c.compileVarspec(spec, expr)
  160. c.prog.op[split2].i = uint32(len(c.prog.op))
  161. }
  162. c.prog.op[split1].i = uint32(len(c.prog.op))
  163. }
  164. func (c *compiler) compileLiterals(lt literals) {
  165. c.compileString(string(lt))
  166. }
  167. func (c *compiler) compile(tmpl *Template) {
  168. c.op(opLineBegin)
  169. for i := range tmpl.exprs {
  170. expr := tmpl.exprs[i]
  171. switch expr := expr.(type) {
  172. default:
  173. panic("unhandled expression")
  174. case *expression:
  175. c.compileExpression(expr)
  176. case literals:
  177. c.compileLiterals(expr)
  178. }
  179. }
  180. c.op(opLineEnd)
  181. c.op(opEnd)
  182. }