collations.go 8.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266
  1. // Go MySQL Driver - A MySQL-Driver for Go's database/sql package
  2. //
  3. // Copyright 2014 The Go-MySQL-Driver Authors. All rights reserved.
  4. //
  5. // This Source Code Form is subject to the terms of the Mozilla Public
  6. // License, v. 2.0. If a copy of the MPL was not distributed with this file,
  7. // You can obtain one at http://mozilla.org/MPL/2.0/.
  8. package mysql
  9. const defaultCollation = "utf8mb4_general_ci"
  10. const binaryCollationID = 63
  11. // A list of available collations mapped to the internal ID.
  12. // To update this map use the following MySQL query:
  13. //
  14. // SELECT COLLATION_NAME, ID FROM information_schema.COLLATIONS WHERE ID<256 ORDER BY ID
  15. //
  16. // Handshake packet have only 1 byte for collation_id. So we can't use collations with ID > 255.
  17. //
  18. // ucs2, utf16, and utf32 can't be used for connection charset.
  19. // https://dev.mysql.com/doc/refman/5.7/en/charset-connection.html#charset-connection-impermissible-client-charset
  20. // They are commented out to reduce this map.
  21. var collations = map[string]byte{
  22. "big5_chinese_ci": 1,
  23. "latin2_czech_cs": 2,
  24. "dec8_swedish_ci": 3,
  25. "cp850_general_ci": 4,
  26. "latin1_german1_ci": 5,
  27. "hp8_english_ci": 6,
  28. "koi8r_general_ci": 7,
  29. "latin1_swedish_ci": 8,
  30. "latin2_general_ci": 9,
  31. "swe7_swedish_ci": 10,
  32. "ascii_general_ci": 11,
  33. "ujis_japanese_ci": 12,
  34. "sjis_japanese_ci": 13,
  35. "cp1251_bulgarian_ci": 14,
  36. "latin1_danish_ci": 15,
  37. "hebrew_general_ci": 16,
  38. "tis620_thai_ci": 18,
  39. "euckr_korean_ci": 19,
  40. "latin7_estonian_cs": 20,
  41. "latin2_hungarian_ci": 21,
  42. "koi8u_general_ci": 22,
  43. "cp1251_ukrainian_ci": 23,
  44. "gb2312_chinese_ci": 24,
  45. "greek_general_ci": 25,
  46. "cp1250_general_ci": 26,
  47. "latin2_croatian_ci": 27,
  48. "gbk_chinese_ci": 28,
  49. "cp1257_lithuanian_ci": 29,
  50. "latin5_turkish_ci": 30,
  51. "latin1_german2_ci": 31,
  52. "armscii8_general_ci": 32,
  53. "utf8_general_ci": 33,
  54. "cp1250_czech_cs": 34,
  55. //"ucs2_general_ci": 35,
  56. "cp866_general_ci": 36,
  57. "keybcs2_general_ci": 37,
  58. "macce_general_ci": 38,
  59. "macroman_general_ci": 39,
  60. "cp852_general_ci": 40,
  61. "latin7_general_ci": 41,
  62. "latin7_general_cs": 42,
  63. "macce_bin": 43,
  64. "cp1250_croatian_ci": 44,
  65. "utf8mb4_general_ci": 45,
  66. "utf8mb4_bin": 46,
  67. "latin1_bin": 47,
  68. "latin1_general_ci": 48,
  69. "latin1_general_cs": 49,
  70. "cp1251_bin": 50,
  71. "cp1251_general_ci": 51,
  72. "cp1251_general_cs": 52,
  73. "macroman_bin": 53,
  74. //"utf16_general_ci": 54,
  75. //"utf16_bin": 55,
  76. //"utf16le_general_ci": 56,
  77. "cp1256_general_ci": 57,
  78. "cp1257_bin": 58,
  79. "cp1257_general_ci": 59,
  80. //"utf32_general_ci": 60,
  81. //"utf32_bin": 61,
  82. //"utf16le_bin": 62,
  83. "binary": 63,
  84. "armscii8_bin": 64,
  85. "ascii_bin": 65,
  86. "cp1250_bin": 66,
  87. "cp1256_bin": 67,
  88. "cp866_bin": 68,
  89. "dec8_bin": 69,
  90. "greek_bin": 70,
  91. "hebrew_bin": 71,
  92. "hp8_bin": 72,
  93. "keybcs2_bin": 73,
  94. "koi8r_bin": 74,
  95. "koi8u_bin": 75,
  96. "utf8_tolower_ci": 76,
  97. "latin2_bin": 77,
  98. "latin5_bin": 78,
  99. "latin7_bin": 79,
  100. "cp850_bin": 80,
  101. "cp852_bin": 81,
  102. "swe7_bin": 82,
  103. "utf8_bin": 83,
  104. "big5_bin": 84,
  105. "euckr_bin": 85,
  106. "gb2312_bin": 86,
  107. "gbk_bin": 87,
  108. "sjis_bin": 88,
  109. "tis620_bin": 89,
  110. //"ucs2_bin": 90,
  111. "ujis_bin": 91,
  112. "geostd8_general_ci": 92,
  113. "geostd8_bin": 93,
  114. "latin1_spanish_ci": 94,
  115. "cp932_japanese_ci": 95,
  116. "cp932_bin": 96,
  117. "eucjpms_japanese_ci": 97,
  118. "eucjpms_bin": 98,
  119. "cp1250_polish_ci": 99,
  120. //"utf16_unicode_ci": 101,
  121. //"utf16_icelandic_ci": 102,
  122. //"utf16_latvian_ci": 103,
  123. //"utf16_romanian_ci": 104,
  124. //"utf16_slovenian_ci": 105,
  125. //"utf16_polish_ci": 106,
  126. //"utf16_estonian_ci": 107,
  127. //"utf16_spanish_ci": 108,
  128. //"utf16_swedish_ci": 109,
  129. //"utf16_turkish_ci": 110,
  130. //"utf16_czech_ci": 111,
  131. //"utf16_danish_ci": 112,
  132. //"utf16_lithuanian_ci": 113,
  133. //"utf16_slovak_ci": 114,
  134. //"utf16_spanish2_ci": 115,
  135. //"utf16_roman_ci": 116,
  136. //"utf16_persian_ci": 117,
  137. //"utf16_esperanto_ci": 118,
  138. //"utf16_hungarian_ci": 119,
  139. //"utf16_sinhala_ci": 120,
  140. //"utf16_german2_ci": 121,
  141. //"utf16_croatian_ci": 122,
  142. //"utf16_unicode_520_ci": 123,
  143. //"utf16_vietnamese_ci": 124,
  144. //"ucs2_unicode_ci": 128,
  145. //"ucs2_icelandic_ci": 129,
  146. //"ucs2_latvian_ci": 130,
  147. //"ucs2_romanian_ci": 131,
  148. //"ucs2_slovenian_ci": 132,
  149. //"ucs2_polish_ci": 133,
  150. //"ucs2_estonian_ci": 134,
  151. //"ucs2_spanish_ci": 135,
  152. //"ucs2_swedish_ci": 136,
  153. //"ucs2_turkish_ci": 137,
  154. //"ucs2_czech_ci": 138,
  155. //"ucs2_danish_ci": 139,
  156. //"ucs2_lithuanian_ci": 140,
  157. //"ucs2_slovak_ci": 141,
  158. //"ucs2_spanish2_ci": 142,
  159. //"ucs2_roman_ci": 143,
  160. //"ucs2_persian_ci": 144,
  161. //"ucs2_esperanto_ci": 145,
  162. //"ucs2_hungarian_ci": 146,
  163. //"ucs2_sinhala_ci": 147,
  164. //"ucs2_german2_ci": 148,
  165. //"ucs2_croatian_ci": 149,
  166. //"ucs2_unicode_520_ci": 150,
  167. //"ucs2_vietnamese_ci": 151,
  168. //"ucs2_general_mysql500_ci": 159,
  169. //"utf32_unicode_ci": 160,
  170. //"utf32_icelandic_ci": 161,
  171. //"utf32_latvian_ci": 162,
  172. //"utf32_romanian_ci": 163,
  173. //"utf32_slovenian_ci": 164,
  174. //"utf32_polish_ci": 165,
  175. //"utf32_estonian_ci": 166,
  176. //"utf32_spanish_ci": 167,
  177. //"utf32_swedish_ci": 168,
  178. //"utf32_turkish_ci": 169,
  179. //"utf32_czech_ci": 170,
  180. //"utf32_danish_ci": 171,
  181. //"utf32_lithuanian_ci": 172,
  182. //"utf32_slovak_ci": 173,
  183. //"utf32_spanish2_ci": 174,
  184. //"utf32_roman_ci": 175,
  185. //"utf32_persian_ci": 176,
  186. //"utf32_esperanto_ci": 177,
  187. //"utf32_hungarian_ci": 178,
  188. //"utf32_sinhala_ci": 179,
  189. //"utf32_german2_ci": 180,
  190. //"utf32_croatian_ci": 181,
  191. //"utf32_unicode_520_ci": 182,
  192. //"utf32_vietnamese_ci": 183,
  193. "utf8_unicode_ci": 192,
  194. "utf8_icelandic_ci": 193,
  195. "utf8_latvian_ci": 194,
  196. "utf8_romanian_ci": 195,
  197. "utf8_slovenian_ci": 196,
  198. "utf8_polish_ci": 197,
  199. "utf8_estonian_ci": 198,
  200. "utf8_spanish_ci": 199,
  201. "utf8_swedish_ci": 200,
  202. "utf8_turkish_ci": 201,
  203. "utf8_czech_ci": 202,
  204. "utf8_danish_ci": 203,
  205. "utf8_lithuanian_ci": 204,
  206. "utf8_slovak_ci": 205,
  207. "utf8_spanish2_ci": 206,
  208. "utf8_roman_ci": 207,
  209. "utf8_persian_ci": 208,
  210. "utf8_esperanto_ci": 209,
  211. "utf8_hungarian_ci": 210,
  212. "utf8_sinhala_ci": 211,
  213. "utf8_german2_ci": 212,
  214. "utf8_croatian_ci": 213,
  215. "utf8_unicode_520_ci": 214,
  216. "utf8_vietnamese_ci": 215,
  217. "utf8_general_mysql500_ci": 223,
  218. "utf8mb4_unicode_ci": 224,
  219. "utf8mb4_icelandic_ci": 225,
  220. "utf8mb4_latvian_ci": 226,
  221. "utf8mb4_romanian_ci": 227,
  222. "utf8mb4_slovenian_ci": 228,
  223. "utf8mb4_polish_ci": 229,
  224. "utf8mb4_estonian_ci": 230,
  225. "utf8mb4_spanish_ci": 231,
  226. "utf8mb4_swedish_ci": 232,
  227. "utf8mb4_turkish_ci": 233,
  228. "utf8mb4_czech_ci": 234,
  229. "utf8mb4_danish_ci": 235,
  230. "utf8mb4_lithuanian_ci": 236,
  231. "utf8mb4_slovak_ci": 237,
  232. "utf8mb4_spanish2_ci": 238,
  233. "utf8mb4_roman_ci": 239,
  234. "utf8mb4_persian_ci": 240,
  235. "utf8mb4_esperanto_ci": 241,
  236. "utf8mb4_hungarian_ci": 242,
  237. "utf8mb4_sinhala_ci": 243,
  238. "utf8mb4_german2_ci": 244,
  239. "utf8mb4_croatian_ci": 245,
  240. "utf8mb4_unicode_520_ci": 246,
  241. "utf8mb4_vietnamese_ci": 247,
  242. "gb18030_chinese_ci": 248,
  243. "gb18030_bin": 249,
  244. "gb18030_unicode_520_ci": 250,
  245. "utf8mb4_0900_ai_ci": 255,
  246. }
  247. // A denylist of collations which is unsafe to interpolate parameters.
  248. // These multibyte encodings may contains 0x5c (`\`) in their trailing bytes.
  249. var unsafeCollations = map[string]bool{
  250. "big5_chinese_ci": true,
  251. "sjis_japanese_ci": true,
  252. "gbk_chinese_ci": true,
  253. "big5_bin": true,
  254. "gb2312_bin": true,
  255. "gbk_bin": true,
  256. "sjis_bin": true,
  257. "cp932_japanese_ci": true,
  258. "cp932_bin": true,
  259. "gb18030_chinese_ci": true,
  260. "gb18030_bin": true,
  261. "gb18030_unicode_520_ci": true,
  262. }