salsa208.go 5.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201
  1. // Copyright 2012 The Go Authors. All rights reserved.
  2. // Use of this source code is governed by a BSD-style
  3. // license that can be found in the LICENSE file.
  4. package salsa
  5. import "math/bits"
  6. // Core208 applies the Salsa20/8 core function to the 64-byte array in and puts
  7. // the result into the 64-byte array out. The input and output may be the same array.
  8. func Core208(out *[64]byte, in *[64]byte) {
  9. j0 := uint32(in[0]) | uint32(in[1])<<8 | uint32(in[2])<<16 | uint32(in[3])<<24
  10. j1 := uint32(in[4]) | uint32(in[5])<<8 | uint32(in[6])<<16 | uint32(in[7])<<24
  11. j2 := uint32(in[8]) | uint32(in[9])<<8 | uint32(in[10])<<16 | uint32(in[11])<<24
  12. j3 := uint32(in[12]) | uint32(in[13])<<8 | uint32(in[14])<<16 | uint32(in[15])<<24
  13. j4 := uint32(in[16]) | uint32(in[17])<<8 | uint32(in[18])<<16 | uint32(in[19])<<24
  14. j5 := uint32(in[20]) | uint32(in[21])<<8 | uint32(in[22])<<16 | uint32(in[23])<<24
  15. j6 := uint32(in[24]) | uint32(in[25])<<8 | uint32(in[26])<<16 | uint32(in[27])<<24
  16. j7 := uint32(in[28]) | uint32(in[29])<<8 | uint32(in[30])<<16 | uint32(in[31])<<24
  17. j8 := uint32(in[32]) | uint32(in[33])<<8 | uint32(in[34])<<16 | uint32(in[35])<<24
  18. j9 := uint32(in[36]) | uint32(in[37])<<8 | uint32(in[38])<<16 | uint32(in[39])<<24
  19. j10 := uint32(in[40]) | uint32(in[41])<<8 | uint32(in[42])<<16 | uint32(in[43])<<24
  20. j11 := uint32(in[44]) | uint32(in[45])<<8 | uint32(in[46])<<16 | uint32(in[47])<<24
  21. j12 := uint32(in[48]) | uint32(in[49])<<8 | uint32(in[50])<<16 | uint32(in[51])<<24
  22. j13 := uint32(in[52]) | uint32(in[53])<<8 | uint32(in[54])<<16 | uint32(in[55])<<24
  23. j14 := uint32(in[56]) | uint32(in[57])<<8 | uint32(in[58])<<16 | uint32(in[59])<<24
  24. j15 := uint32(in[60]) | uint32(in[61])<<8 | uint32(in[62])<<16 | uint32(in[63])<<24
  25. x0, x1, x2, x3, x4, x5, x6, x7, x8 := j0, j1, j2, j3, j4, j5, j6, j7, j8
  26. x9, x10, x11, x12, x13, x14, x15 := j9, j10, j11, j12, j13, j14, j15
  27. for i := 0; i < 8; i += 2 {
  28. u := x0 + x12
  29. x4 ^= bits.RotateLeft32(u, 7)
  30. u = x4 + x0
  31. x8 ^= bits.RotateLeft32(u, 9)
  32. u = x8 + x4
  33. x12 ^= bits.RotateLeft32(u, 13)
  34. u = x12 + x8
  35. x0 ^= bits.RotateLeft32(u, 18)
  36. u = x5 + x1
  37. x9 ^= bits.RotateLeft32(u, 7)
  38. u = x9 + x5
  39. x13 ^= bits.RotateLeft32(u, 9)
  40. u = x13 + x9
  41. x1 ^= bits.RotateLeft32(u, 13)
  42. u = x1 + x13
  43. x5 ^= bits.RotateLeft32(u, 18)
  44. u = x10 + x6
  45. x14 ^= bits.RotateLeft32(u, 7)
  46. u = x14 + x10
  47. x2 ^= bits.RotateLeft32(u, 9)
  48. u = x2 + x14
  49. x6 ^= bits.RotateLeft32(u, 13)
  50. u = x6 + x2
  51. x10 ^= bits.RotateLeft32(u, 18)
  52. u = x15 + x11
  53. x3 ^= bits.RotateLeft32(u, 7)
  54. u = x3 + x15
  55. x7 ^= bits.RotateLeft32(u, 9)
  56. u = x7 + x3
  57. x11 ^= bits.RotateLeft32(u, 13)
  58. u = x11 + x7
  59. x15 ^= bits.RotateLeft32(u, 18)
  60. u = x0 + x3
  61. x1 ^= bits.RotateLeft32(u, 7)
  62. u = x1 + x0
  63. x2 ^= bits.RotateLeft32(u, 9)
  64. u = x2 + x1
  65. x3 ^= bits.RotateLeft32(u, 13)
  66. u = x3 + x2
  67. x0 ^= bits.RotateLeft32(u, 18)
  68. u = x5 + x4
  69. x6 ^= bits.RotateLeft32(u, 7)
  70. u = x6 + x5
  71. x7 ^= bits.RotateLeft32(u, 9)
  72. u = x7 + x6
  73. x4 ^= bits.RotateLeft32(u, 13)
  74. u = x4 + x7
  75. x5 ^= bits.RotateLeft32(u, 18)
  76. u = x10 + x9
  77. x11 ^= bits.RotateLeft32(u, 7)
  78. u = x11 + x10
  79. x8 ^= bits.RotateLeft32(u, 9)
  80. u = x8 + x11
  81. x9 ^= bits.RotateLeft32(u, 13)
  82. u = x9 + x8
  83. x10 ^= bits.RotateLeft32(u, 18)
  84. u = x15 + x14
  85. x12 ^= bits.RotateLeft32(u, 7)
  86. u = x12 + x15
  87. x13 ^= bits.RotateLeft32(u, 9)
  88. u = x13 + x12
  89. x14 ^= bits.RotateLeft32(u, 13)
  90. u = x14 + x13
  91. x15 ^= bits.RotateLeft32(u, 18)
  92. }
  93. x0 += j0
  94. x1 += j1
  95. x2 += j2
  96. x3 += j3
  97. x4 += j4
  98. x5 += j5
  99. x6 += j6
  100. x7 += j7
  101. x8 += j8
  102. x9 += j9
  103. x10 += j10
  104. x11 += j11
  105. x12 += j12
  106. x13 += j13
  107. x14 += j14
  108. x15 += j15
  109. out[0] = byte(x0)
  110. out[1] = byte(x0 >> 8)
  111. out[2] = byte(x0 >> 16)
  112. out[3] = byte(x0 >> 24)
  113. out[4] = byte(x1)
  114. out[5] = byte(x1 >> 8)
  115. out[6] = byte(x1 >> 16)
  116. out[7] = byte(x1 >> 24)
  117. out[8] = byte(x2)
  118. out[9] = byte(x2 >> 8)
  119. out[10] = byte(x2 >> 16)
  120. out[11] = byte(x2 >> 24)
  121. out[12] = byte(x3)
  122. out[13] = byte(x3 >> 8)
  123. out[14] = byte(x3 >> 16)
  124. out[15] = byte(x3 >> 24)
  125. out[16] = byte(x4)
  126. out[17] = byte(x4 >> 8)
  127. out[18] = byte(x4 >> 16)
  128. out[19] = byte(x4 >> 24)
  129. out[20] = byte(x5)
  130. out[21] = byte(x5 >> 8)
  131. out[22] = byte(x5 >> 16)
  132. out[23] = byte(x5 >> 24)
  133. out[24] = byte(x6)
  134. out[25] = byte(x6 >> 8)
  135. out[26] = byte(x6 >> 16)
  136. out[27] = byte(x6 >> 24)
  137. out[28] = byte(x7)
  138. out[29] = byte(x7 >> 8)
  139. out[30] = byte(x7 >> 16)
  140. out[31] = byte(x7 >> 24)
  141. out[32] = byte(x8)
  142. out[33] = byte(x8 >> 8)
  143. out[34] = byte(x8 >> 16)
  144. out[35] = byte(x8 >> 24)
  145. out[36] = byte(x9)
  146. out[37] = byte(x9 >> 8)
  147. out[38] = byte(x9 >> 16)
  148. out[39] = byte(x9 >> 24)
  149. out[40] = byte(x10)
  150. out[41] = byte(x10 >> 8)
  151. out[42] = byte(x10 >> 16)
  152. out[43] = byte(x10 >> 24)
  153. out[44] = byte(x11)
  154. out[45] = byte(x11 >> 8)
  155. out[46] = byte(x11 >> 16)
  156. out[47] = byte(x11 >> 24)
  157. out[48] = byte(x12)
  158. out[49] = byte(x12 >> 8)
  159. out[50] = byte(x12 >> 16)
  160. out[51] = byte(x12 >> 24)
  161. out[52] = byte(x13)
  162. out[53] = byte(x13 >> 8)
  163. out[54] = byte(x13 >> 16)
  164. out[55] = byte(x13 >> 24)
  165. out[56] = byte(x14)
  166. out[57] = byte(x14 >> 8)
  167. out[58] = byte(x14 >> 16)
  168. out[59] = byte(x14 >> 24)
  169. out[60] = byte(x15)
  170. out[61] = byte(x15 >> 8)
  171. out[62] = byte(x15 >> 16)
  172. out[63] = byte(x15 >> 24)
  173. }