当前位置：文江博客话题详情

Web开发程序设计

UTF-8字符集在AJAX下中文乱码的解决办法

发布于 2022-09-12 21:29:51 字数 4665 浏览 10 评论 0

转自http://bbs.lampbrother.net/read-htm-tid-2610.html

本以为全部使用 UTF-8 就不用关心乱码问题了，结果乱码还是出现了。查了些英文资料，问题解决了。

方法很简单 , 直接对提交的数据进行编码即可..

但是 UTF-8 字符与 ASCII 字符的编码方式不一样：非 ASCII 字符在 UTF-8 中占多个字节，需要对每个字节分别做百分号编码。下面是修正办法：

var str = document.frm.username.value
修改成
var str = encode(document.frm.username.value)

然后把下面的代码复制到上面这条语句之前：

// Characters that encode() copies to its output unchanged: digits, upper-case
// letters, lower-case letters, then "-", "_", "." and "~".
var unreserved = "0123456789" + "ABCDEFGHIJKLMNOPQRSTUVWXYZ" + "abcdefghijklmnopqrstuvwxyz" + "-_.~";
// Delimiter-style characters. Not referenced by the encoding code visible
// here; encode() percent-encodes them like any other non-unreserved character.
var reserved = "!*'();:@&=+$,/?%#[]";
// Union of the two sets above (unreserved characters first).
var allowed = unreserved + reserved;
// Hexadecimal digits. gethex() indexes the first sixteen (upper-case) entries
// by nibble value; the lower-case tail is not reached for inputs up to 255.
var hexchars = "0123456789ABCDEF" + "abcdef";
// --------------------------------- Encoding -------------------------------
// Formats one byte as a percent-encoded triplet: "%" followed by two
// hexadecimal digits looked up in `hexchars`.
// `decimal` is expected to be an integer in the range 0..255.
function gethex(decimal) {
  var highNibble = decimal >> 4;   // upper four bits select the first digit
  var lowNibble = decimal & 0xF;   // lower four bits select the second digit
  return ["%", hexchars.charAt(highNibble), hexchars.charAt(lowNibble)].join("");
}
// Percent-encodes `str` using the UTF-8 byte sequence of each character.
//
// Characters listed in `unreserved` are copied through unchanged; every other
// character (including the ones in `reserved`) is converted to its UTF-8
// bytes and each byte is written as "%XX" via gethex().
//
// JavaScript strings are sequences of UTF-16 code units, so a character
// outside the Basic Multilingual Plane arrives as a surrogate pair. The pair
// is combined into a single code point before encoding so that it produces
// one 4-byte UTF-8 sequence instead of two invalid 3-byte sequences. An
// unpaired surrogate has no UTF-8 representation and is encoded as
// U+FFFD (REPLACEMENT CHARACTER).
//
// Returns the encoded string.
function encode(str) {
  var encoded = "";
  for (var i = 0; i < str.length; i++) {
    var ch = str.charAt(i);

    // Unreserved characters need no encoding.
    if (unreserved.indexOf(ch) !== -1) {
      encoded += ch;
      continue;
    }

    var codePoint = str.charCodeAt(i);

    if (codePoint >= 0xD800 && codePoint <= 0xDBFF) {
      // High surrogate: it must be followed by a low surrogate.
      // charCodeAt() yields NaN past the end, which fails the range test.
      var low = str.charCodeAt(i + 1);
      if (low >= 0xDC00 && low <= 0xDFFF) {
        codePoint = 0x10000 + ((codePoint - 0xD800) << 10) + (low - 0xDC00);
        i++; // the low surrogate has been consumed as part of this character
      } else {
        codePoint = 0xFFFD;
      }
    } else if (codePoint >= 0xDC00 && codePoint <= 0xDFFF) {
      // Low surrogate without a preceding high surrogate.
      codePoint = 0xFFFD;
    }

    // Code point range | Bytes | UTF-8 bit layout
    // ------------------------------------------------------------------
    // 0 - 127          | 1     | 0XXXXXXX
    // 128 - 2047       | 2     | 110XXXXX 10XXXXXX
    // 2048 - 65535     | 3     | 1110XXXX 10XXXXXX 10XXXXXX
    // 65536 - 1114111  | 4     | 11110XXX 10XXXXXX 10XXXXXX 10XXXXXX
    if (codePoint < 0x80) {
      encoded += gethex(codePoint);
    } else if (codePoint < 0x800) {
      encoded += gethex((codePoint >> 6) | 0xC0);
      encoded += gethex((codePoint & 0x3F) | 0x80);
    } else if (codePoint < 0x10000) {
      encoded += gethex((codePoint >> 12) | 0xE0);
      encoded += gethex(((codePoint >> 6) & 0x3F) | 0x80);
      encoded += gethex((codePoint & 0x3F) | 0x80);
    } else {
      encoded += gethex((codePoint >> 18) | 0xF0);
      encoded += gethex(((codePoint >> 12) & 0x3F) | 0x80);
      encoded += gethex(((codePoint >> 6) & 0x3F) | 0x80);
      encoded += gethex((codePoint & 0x3F) | 0x80);
    }
  }
  return encoded;
}

复制代码ok，大功告成！

收藏 0

分享到微博

如果你对这篇内容有疑问，欢迎到本站社区发帖提问参与讨论，获取更多帮助，或者扫描二维码加入 Web 技术交流群。

扫码二维码加入Web技术交流群

发布评论

需要登录才能够评论，你可以免费注册一个本站的账号。

列表为空，暂无数据

关于作者

暂无简介

文章

评论

26 人气

关注发私信

相关话题

热门标签

操作系统程序设计 IT运维 Linux系统管理 JavaScript 服务器应用 solaris C/C++ PHP Shell BSD Vue.js aix Oracle Python HTML 系统管理 HTML5 CSS 前端

推荐作者

燃烧我的卡路李先生

文章 0 评论 0

qq_2gSKZM

文章 0 评论 0

∞梦里开花

文章 0 评论 0

qq_IklFPL

文章 0 评论 0

迷途知返

文章 0 评论 0

深海不蓝

文章 0 评论 0

友情链接

我们使用 Cookies 和其他技术来定制您的体验包括您的登录状态等。通过阅读我们的隐私政策了解更多相关信息。单击 接受 或继续使用网站，即表示您同意使用 Cookies 和您的相关数据。

原文