mapping-ISOLatin1Accent.txt 2.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236
  1. # This file contains character mappings for the default fulltext field type.
  2. # The source characters (on the left) will be replaced by the respective target
  3. # characters before any other processing takes place.
  4. # Lines starting with a pound character # are ignored.
  5. #
  6. # For sensible defaults, use the mapping-ISOLatin1Accent.txt file distributed
  7. # with the example application of your Solr version.
  8. #
  9. # Examples:
  10. # "À" => "A"
  11. # "\u00c4" => "A"
  12. # "\u00c4" => "\u0041"
  13. # "æ" => "ae"
  14. # "\n" => " "
  15. # À => A
  16. "\u00C0" => "A"
  17. # Á => A
  18. "\u00C1" => "A"
  19. # Â => A
  20. "\u00C2" => "A"
  21. # Ã => A
  22. "\u00C3" => "A"
  23. # Ä => A
  24. "\u00C4" => "A"
  25. # Å => A
  26. "\u00C5" => "A"
  27. # Æ => AE
  28. "\u00C6" => "AE"
  29. # Ç => C
  30. "\u00C7" => "C"
  31. # È => E
  32. "\u00C8" => "E"
  33. # É => E
  34. "\u00C9" => "E"
  35. # Ê => E
  36. "\u00CA" => "E"
  37. # Ë => E
  38. "\u00CB" => "E"
  39. # Ì => I
  40. "\u00CC" => "I"
  41. # Í => I
  42. "\u00CD" => "I"
  43. # Î => I
  44. "\u00CE" => "I"
  45. # Ï => I
  46. "\u00CF" => "I"
  47. # Ĳ => IJ
  48. "\u0132" => "IJ"
  49. # Ð => D
  50. "\u00D0" => "D"
  51. # Ñ => N
  52. "\u00D1" => "N"
  53. # Ò => O
  54. "\u00D2" => "O"
  55. # Ó => O
  56. "\u00D3" => "O"
  57. # Ô => O
  58. "\u00D4" => "O"
  59. # Õ => O
  60. "\u00D5" => "O"
  61. # Ö => O
  62. "\u00D6" => "O"
  63. # Ø => O
  64. "\u00D8" => "O"
  65. # Œ => OE
  66. "\u0152" => "OE"
  67. # Þ => TH
  68. "\u00DE" => "TH"
  69. # Ù => U
  70. "\u00D9" => "U"
  71. # Ú => U
  72. "\u00DA" => "U"
  73. # Û => U
  74. "\u00DB" => "U"
  75. # Ü => U
  76. "\u00DC" => "U"
  77. # Ý => Y
  78. "\u00DD" => "Y"
  79. # Ÿ => Y
  80. "\u0178" => "Y"
  81. # à => a
  82. "\u00E0" => "a"
  83. # á => a
  84. "\u00E1" => "a"
  85. # â => a
  86. "\u00E2" => "a"
  87. # ã => a
  88. "\u00E3" => "a"
  89. # ä => a
  90. "\u00E4" => "a"
  91. # å => a
  92. "\u00E5" => "a"
  93. # æ => ae
  94. "\u00E6" => "ae"
  95. # ç => c
  96. "\u00E7" => "c"
  97. # è => e
  98. "\u00E8" => "e"
  99. # é => e
  100. "\u00E9" => "e"
  101. # ê => e
  102. "\u00EA" => "e"
  103. # ë => e
  104. "\u00EB" => "e"
  105. # ì => i
  106. "\u00EC" => "i"
  107. # í => i
  108. "\u00ED" => "i"
  109. # î => i
  110. "\u00EE" => "i"
  111. # ï => i
  112. "\u00EF" => "i"
  113. # ĳ => ij
  114. "\u0133" => "ij"
  115. # ð => d
  116. "\u00F0" => "d"
  117. # ñ => n
  118. "\u00F1" => "n"
  119. # ò => o
  120. "\u00F2" => "o"
  121. # ó => o
  122. "\u00F3" => "o"
  123. # ô => o
  124. "\u00F4" => "o"
  125. # õ => o
  126. "\u00F5" => "o"
  127. # ö => o
  128. "\u00F6" => "o"
  129. # ø => o
  130. "\u00F8" => "o"
  131. # œ => oe
  132. "\u0153" => "oe"
  133. # ß => ss
  134. "\u00DF" => "ss"
  135. # þ => th
  136. "\u00FE" => "th"
  137. # ù => u
  138. "\u00F9" => "u"
  139. # ú => u
  140. "\u00FA" => "u"
  141. # û => u
  142. "\u00FB" => "u"
  143. # ü => u
  144. "\u00FC" => "u"
  145. # ý => y
  146. "\u00FD" => "y"
  147. # ÿ => y
  148. "\u00FF" => "y"
  149. # ﬀ => ff
  150. "\uFB00" => "ff"
  151. # ﬁ => fi
  152. "\uFB01" => "fi"
  153. # ﬂ => fl
  154. "\uFB02" => "fl"
  155. # ﬃ => ffi
  156. "\uFB03" => "ffi"
  157. # ﬄ => ffl
  158. "\uFB04" => "ffl"
  159. # ﬅ => ft
  160. "\uFB05" => "ft"
  161. # ﬆ => st
  162. "\uFB06" => "st"