text_encoder.go 5.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249
  1. package pdf417
  2. import "fmt"
  3. // Since each code word consists of 2 characters, a padding value is
  4. // needed when encoding a single character. 29 is used as padding because
  5. // it's a switch in all 4 submodes, and doesn't add any data.
  6. const padding_value = 29
  7. type subMode byte
  8. const (
  9. subUpper subMode = iota
  10. subLower
  11. subMixed
  12. subPunct
  13. )
  14. const (
  15. switchUpper = '\u00f1'
  16. switchUpperSingle = '\u00f2'
  17. switchLower = '\u00f3'
  18. switchMixed = '\u00f4'
  19. switchPunct = '\u00f5'
  20. switchPunctSingle = '\u00f6'
  21. )
  22. type textEncoder struct {
  23. Switching map[subMode]map[subMode][]rune
  24. SwitchSubmode map[rune]subMode
  25. ReverseLookup map[rune]map[subMode]int
  26. }
  27. func newTextEncoder() *textEncoder {
  28. encoder := new(textEncoder)
  29. characterTables := map[subMode][]rune{
  30. subUpper: []rune{
  31. 'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I',
  32. 'J', 'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R',
  33. 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', ' ',
  34. switchLower,
  35. switchMixed,
  36. switchPunctSingle,
  37. },
  38. subLower: []rune{
  39. 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i',
  40. 'j', 'k', 'l', 'm', 'n', 'o', 'p', 'q', 'r',
  41. 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', ' ',
  42. switchUpperSingle,
  43. switchMixed,
  44. switchPunctSingle,
  45. },
  46. subMixed: []rune{
  47. '0', '1', '2', '3', '4', '5', '6', '7', '8',
  48. '9', '&', '\r', '\t', ',', ':', '#', '-', '.',
  49. '$', '/', '+', '%', '*', '=', '^',
  50. switchPunct, ' ',
  51. switchLower,
  52. switchUpper,
  53. switchPunctSingle,
  54. },
  55. subPunct: []rune{
  56. ';', '<', '>', '@', '[', '\\', ']', '_', '`',
  57. '~', '!', '\r', '\t', ',', ':', '\n', '-', '.',
  58. '$', '/', 'g', '|', '*', '(', ')', '?', '{', '}', '\'',
  59. switchUpper,
  60. },
  61. }
  62. encoder.Switching = map[subMode]map[subMode][]rune{
  63. subUpper: map[subMode][]rune{
  64. subLower: []rune{switchLower},
  65. subMixed: []rune{switchMixed},
  66. subPunct: []rune{switchMixed, switchPunct},
  67. },
  68. subLower: map[subMode][]rune{
  69. subUpper: []rune{switchMixed, switchUpper},
  70. subMixed: []rune{switchMixed},
  71. subPunct: []rune{switchMixed, switchPunct},
  72. },
  73. subMixed: map[subMode][]rune{
  74. subUpper: []rune{switchUpper},
  75. subLower: []rune{switchLower},
  76. subPunct: []rune{switchPunct},
  77. },
  78. subPunct: map[subMode][]rune{
  79. subUpper: []rune{switchUpper},
  80. subLower: []rune{switchUpper, switchLower},
  81. subMixed: []rune{switchUpper, switchMixed},
  82. },
  83. }
  84. encoder.SwitchSubmode = map[rune]subMode{
  85. switchUpper: subUpper,
  86. switchLower: subLower,
  87. switchPunct: subPunct,
  88. switchMixed: subMixed,
  89. }
  90. encoder.ReverseLookup = make(map[rune]map[subMode]int)
  91. for submode, codes := range characterTables {
  92. for row, char := range codes {
  93. if encoder.ReverseLookup[char] == nil {
  94. encoder.ReverseLookup[char] = make(map[subMode]int)
  95. }
  96. encoder.ReverseLookup[char][submode] = int(row)
  97. }
  98. }
  99. return encoder
  100. }
  101. func (encoder *textEncoder) CanEncode(char rune) bool {
  102. switch char {
  103. case switchUpper,
  104. switchUpperSingle,
  105. switchLower,
  106. switchMixed,
  107. switchPunct,
  108. switchPunctSingle:
  109. return false
  110. default:
  111. return encoder.ReverseLookup[char] != nil
  112. }
  113. }
  114. func (*textEncoder) GetSwitchCode(data string) int {
  115. return switchCodeText
  116. }
  117. func (encoder *textEncoder) Encode(data string) ([]int, error) {
  118. interim, err := encoder.encodeInterim(data)
  119. if err != nil {
  120. return interim, err
  121. }
  122. return encoder.encodeFinal(interim), nil
  123. }
  124. func (encoder *textEncoder) encodeInterim(data string) ([]int, error) {
  125. submode := subUpper
  126. codes := []int{}
  127. var err error
  128. for _, char := range data {
  129. if !encoder.existsInSubmode(char, submode) {
  130. prevSubmode := submode
  131. submode, err = encoder.getSubmode(char)
  132. if err != nil {
  133. return codes, err
  134. }
  135. switchCodes := encoder.getSwitchCodes(prevSubmode, submode)
  136. codes = append(codes, switchCodes...)
  137. }
  138. codes = append(
  139. codes,
  140. encoder.getCharacterCode(char, submode),
  141. )
  142. }
  143. return codes, nil
  144. }
  145. func (encoder *textEncoder) getSubmode(char rune) (subMode, error) {
  146. if lookup, ok := encoder.ReverseLookup[char]; ok {
  147. for key := range lookup {
  148. return key, nil
  149. }
  150. }
  151. return subLower, fmt.Errorf("unable to find submode for %q", char)
  152. }
  153. func (encoder *textEncoder) getSwitchCodes(from, to subMode) []int {
  154. switches := encoder.Switching[from][to]
  155. codes := []int{}
  156. for _, switcher := range switches {
  157. codes = append(codes, encoder.getCharacterCode(switcher, from))
  158. from = encoder.SwitchSubmode[switcher]
  159. }
  160. return codes
  161. }
  162. func (*textEncoder) encodeFinal(codes []int) []int {
  163. codeWords := []int{}
  164. chunks := [][]int{}
  165. chunkPart := []int{}
  166. i := 0
  167. for _, code := range codes {
  168. chunkPart = append(chunkPart, code)
  169. i++
  170. if i%2 == 0 {
  171. chunks = append(chunks, chunkPart)
  172. chunkPart = []int{}
  173. }
  174. }
  175. if len(chunkPart) > 0 {
  176. chunks = append(chunks, chunkPart)
  177. }
  178. for _, chunk := range chunks {
  179. if len(chunk) == 1 {
  180. chunk = append(chunk, padding_value)
  181. }
  182. codeWords = append(
  183. codeWords,
  184. 30*chunk[0]+chunk[1],
  185. )
  186. }
  187. return codeWords
  188. }
  189. func (encoder *textEncoder) getCharacterCode(char rune, submode subMode) int {
  190. cw, ok := encoder.ReverseLookup[char][submode]
  191. if !ok {
  192. panic("This is not possible")
  193. }
  194. return cw
  195. }
  196. func (encoder *textEncoder) existsInSubmode(char rune, submode subMode) bool {
  197. _, ok := encoder.ReverseLookup[char][submode]
  198. return ok
  199. }