網址鏈接中的中文編碼
中文的gbk(GB2312)編碼: 一個漢字對應兩組%xx,即%xx%xx
中文的UTF-8編碼: 一個漢字對應三組%xx,即%xx%xx%xx
# quote/unquote are documented in urllib.parse; urllib.request merely happens
# to re-export them, so import from the canonical module.
from urllib.parse import quote, unquote

# Encoding: percent-encode a URL whose query contains Chinese characters.
url1 = "https://www.baidu.com/s?wd=中国"

# UTF-8 encoding with an explicit set of safe characters, so the URL
# delimiters stay untouched and only the Chinese text is escaped
# (three %xx groups per character).
ret1 = quote(url1, safe=";/?:@&=+$,", encoding="utf-8")
print(ret1)
# Output: https://www.baidu.com/s?wd=%E4%B8%AD%E5%9B%BD

# GBK encoding (two %xx groups per character). No `safe` argument is given,
# so the default safe="/" applies and ":", "?" and "=" are escaped as well.
ret2 = quote(url1, encoding="gbk")
print(ret2)
# Output: https%3A//www.baidu.com/s%3Fwd%3D%D6%D0%B9%FA

# Decoding: turn the percent-escapes back into text.
url3 = "https://www.baidu.com/s?wd=%E4%B8%AD%E5%9B%BD"
ret3 = unquote(url3, encoding='utf-8')
print(ret3)
# Output: https://www.baidu.com/s?wd=中国
from urllib.parse import urlencode

# Build a query string from a mapping of form fields; each key/value pair
# becomes "key=value" and the pairs are joined with "&".
form_data = {"v1": 1, "v2": 2, "v3": 3, "v4": 4}
print(urlencode(form_data))
# Output: v1=1&v2=2&v3=3&v4=4