当前位置:   article > 正文

字符编码转换类, ANSI、Unicode、Unicode big endian、UTF-8、UTF-8+Bom互相转换_c# unicode ansi utf8 unicodebig5

c# unicode ansi utf8 unicodebig5
  1. <?php
  2. /** 字符编码转换类, ANSI、Unicode、Unicode big endian、UTF-8、UTF-8+Bom互相转换
  3. * Func:
  4. * public convert 转换
  5. * private convToUtf8 把编码转为UTF-8编码
  6. * private convFromUtf8 把UTF-8编码转换为输出编码
  7. */
  8. class CharsetConv { // class start
  9. private $_in_charset = null; // 源编码
  10. private $_out_charset = null; // 输出编码
  11. private $_allow_charset = array('utf-8', 'utf-8bom', 'ansi', 'unicode', 'unicodebe');
  12. /** 初始化
  13. * @param String $in_charset 源编码
  14. * @param String $out_charset 输出编码
  15. */
  16. public function __construct($in_charset, $out_charset) {
  17. $in_charset = strtolower($in_charset);
  18. $out_charset = strtolower($out_charset);
  19. // 检查源编码
  20. if (in_array($in_charset, $this->_allow_charset)) {
  21. $this->_in_charset = $in_charset;
  22. }
  23. // 检查输出编码
  24. if (in_array($out_charset, $this->_allow_charset)) {
  25. $this->_out_charset = $out_charset;
  26. }
  27. }
  28. /** 转换
  29. * @param String $str 要转换的字符串
  30. * @return String 转换后的字符串
  31. */
  32. public function convert($str) {
  33. $str = $this->convToUtf8($str); // 先转为utf8
  34. $str = $this->convFromUtf8($str); // 从utf8转为对应的编码
  35. return $str;
  36. }
  37. /** 把编码转为UTF-8编码
  38. * @param String $str
  39. * @return String
  40. */
  41. private function convToUtf8($str) {
  42. if ($this->_in_charset == 'utf-8') { // 编码已经是utf-8,不用转
  43. return $str;
  44. }
  45. switch ($this->_in_charset) {
  46. case 'utf-8bom':
  47. $str = substr($str, 3);
  48. break;
  49. case 'ansi':
  50. //$str = iconv('GBK', 'UTF-8', $str);
  51. $str = mb_convert_encoding($str, "UTF-8", "GBK");
  52. break;
  53. case 'unicode':
  54. //$str = iconv('UTF-16le', 'UTF-8', substr($str, 2));
  55. $str = mb_convert_encoding(substr($str, 2), "UTF-8", "UTF-16le");
  56. break;
  57. case 'unicodebe':
  58. //$str = iconv('UTF-16be', 'UTF-8', substr($str, 2));
  59. $str = mb_convert_encoding(substr($str, 2), "UTF-8", "UTF-16be");
  60. break;
  61. default:
  62. break;
  63. }
  64. return $str;
  65. }
  66. /** 把UTF-8编码转换为输出编码
  67. * @param String $str
  68. * @return String
  69. */
  70. private function convFromUtf8($str) {
  71. if ($this->_out_charset == 'utf-8') { // 输出编码已经是utf-8,不用转
  72. return $str;
  73. }
  74. switch ($this->_out_charset) {
  75. case 'utf-8bom':
  76. $str = "\xef\xbb\xbf" . $str;
  77. break;
  78. case 'ansi':
  79. //$str = iconv('UTF-8', 'GBK', $str);
  80. $str = mb_convert_encoding($str, "GBK", "UTF-8");
  81. break;
  82. case 'unicode':
  83. //$str = "\xff\xfe".iconv('UTF-8', 'UTF-16le', $str);
  84. $str = "\xff\xfe" . mb_convert_encoding($str, "UTF-16le", "UTF-8");
  85. break;
  86. case 'unicodebe':
  87. //$str = "\xfe\xff".iconv('UTF-8', 'UTF-16be', $str);
  88. $str = "\xfe\xff" . mb_convert_encoding($str, "UTF-16be", "UTF-8");
  89. break;
  90. default:
  91. break;
  92. }
  93. return $str;
  94. }
  95. } // class end
  96. ?>

 

本文内容由网友自发贡献,转载请注明出处:https://www.wpsshop.cn/w/笔触狂放9/article/detail/253379
推荐阅读
相关标签
  

闽ICP备14008679号