解析 JSON HTTP 响应

huangapple go评论74阅读模式
英文:

Unmarshaling a json http response

问题

我最近开始尝试使用GO,并尝试对http://www.oref.org.il/WarningMessages/alerts.json的JSON响应进行解组。但是不知何故,解组失败,解组后的结构体为空(我猜测可能与编码有关)。

以下是代码,希望能帮到你。

谢谢,
Itay

package main

import (
  "fmt"
  "io/ioutil"
  "net/http"
  "encoding/json"
)

const alertsUrl = "http://www.oref.org.il/WarningMessages/alerts.json"

type Record struct {
  Id    string   `json:id`
  Title string   `json:title`
  Data  []string `json:data`
}

func main() {
  client := &http.Client{}
  req, err := http.NewRequest("GET", alertsUrl, nil)
  perror(err)

  req.Header.Add("Content-Type", "application/json; charset=utf-8")
  res, err := client.Do(req)
  perror(err)

  defer res.Body.Close()
  body, err := ioutil.ReadAll(res.Body)
  perror(err)

  var record Record
  json.Unmarshal(body, &record)
  fmt.Println(record)
}

func perror(err error) {
  if err != nil {
    panic(err)
  }
}
英文:

I have very recently started playing with GO and I am trying to unmarshal a JSON response from http://www.oref.org.il/WarningMessages/alerts.json.
For some reason that I can't understand the unmarshaling failed, the unmarshalled struct is empty (my guess is that it is somehow related to encoding).

Below is the code, any help is appreciated.

Thanks,
Itay

package main

import (
  "fmt"
  "io/ioutil"
  "net/http"
  "encoding/json"
)

const alertsUrl = "http://www.oref.org.il/WarningMessages/alerts.json"

type Record struct {
  Id string `json:id`
  Title string `json:title`
  Data []string `json:data`
}

func main() {
  client := &http.Client{}
  req, err := http.NewRequest("GET", alertsUrl, nil)
  perror(err)

  req.Header.Add("Content-Type", "application/json; charset=utf-8")
  res, err := client.Do(req)
  perror(err)

  defer res.Body.Close()
  body, err := ioutil.ReadAll(res.Body)
  perror(err)

  var record Record
  json.Unmarshal(body, &record)
  fmt.Println(record)
}

func perror(err error) {
  if err != nil {
    panic(err)
  }
}

答案1

得分: 3

你正在忽略JSON Unmarshal的错误:

func Unmarshal(data []byte, v interface{}) error

注意它返回一个错误。在代码中添加错误处理:

err = json.Unmarshal(body, &record)
perror(err)

看起来这是一个Unicode错误 - 你需要解码UTF-16数据

你应该如何做到这一点?看一下这个答案。基本上,一旦你像body, err := ioutil.ReadAll(res.Body)这样读取了响应体,你就想将UTF-16字节解码为字符串。这里有很多事情要做,但我们可以做一些简化:例如,打开URL在Chrome中,浏览器告诉我们它是UTF-16 LE编码。所以我们可以跳过字节顺序的检测。所以关键在于这个函数:

func UTF16BytesToString(b []byte, o binary.ByteOrder) string {
    utf := make([]uint16, (len(b)+(2-1))/2)
    for i := 0; i+(2-1) < len(b); i += 2 {
        utf[i/2] = o.Uint16(b[i:])
    }
    if len(b)/2 < len(utf) {
        utf[len(utf)-1] = utf8.RuneError
    }
    return string(utf16.Decode(utf))
}

通过知道字节顺序并传递它,这将把原始的字节数组转换为UTF-16字符的字符串。感谢用户OneOfOne的评论,我们还可以轻松地检测BOM。

结果代码如下:

package main

import (
    "encoding/binary"
    "encoding/json"
    "fmt"
    "io/ioutil"
    "net/http"
    "unicode/utf16"
    "unicode/utf8"
)

const alertsUrl = "http://www.oref.org.il/WarningMessages/alerts.json"

type Record struct {
    Id    string   `json:id`
    Title string   `json:title`
    Data  []string `json:data`
}

// LazyUTF16BytesToString将UTF-16编码的字节,以大端或小端字节顺序,
// 转换为UTF-8编码的字符串。
func LazyUTF16BytesToString(b []byte) string {
    if len(b)%2 != 0 {
        panic("len(b) % 2 != 0")
    }

    var codec binary.ByteOrder = binary.LittleEndian
    if b[0] == 0xFE && b[1] == 0xFF { //检查并去除BOM
        b = b[2:]
        codec = binary.BigEndian
    } else if b[0] == 0xFF && b[1] == 0xFE {
        b = b[2:]
    }

    utf := make([]uint16, (len(b)+(2-1))/2)
    for i := 0; i+(2-1) < len(b); i += 2 {
        utf[i/2] = codec.Uint16(b[i:])
    }
    if len(b)/2 < len(utf) {
        utf[len(utf)-1] = utf8.RuneError
    }
    return string(utf16.Decode(utf))
}

func main() {
    client := &http.Client{}
    req, err := http.NewRequest("GET", alertsUrl, nil)
    perror(err)

    req.Header.Add("Content-Type", "application/json; charset=utf-8")
    res, err := client.Do(req)
    perror(err)

    defer res.Body.Close()
    body, err := ioutil.ReadAll(res.Body)
    perror(err)

    bodyString := LazyUTF16BytesToString(body)

    var record Record
    err = json.Unmarshal([]byte(bodyString), &record)
    perror(err)
    fmt.Println(record)
}

func perror(err error) {
    if err != nil {
        panic(err)
    }
}

希望对你有帮助!

英文:

You're ignoring the error on JSON Unmarshal:

func Unmarshal(data []byte, v interface{}) error

See that it returns an error. Adding that in,

err = json.Unmarshal(body, &amp;record)
perror(err)

It looks like this is a Unicode error — you need to decode the UTF-16 data.

How should you do this? Take a look at this answer. Basically once you read the body like body, err := ioutil.ReadAll(res.Body), you want to decode the UTF-16 bytes to a string. There is a lot going on there, but we can take some liberties: for instance, pulling up the URL in Chrome, the browser tells us that it is UTF-16 LE. So we can skip the ByteOrder detection. So the key here is this function:

func UTF16BytesToString(b []byte, o binary.ByteOrder) string {
utf := make([]uint16, (len(b)+(2-1))/2)
for i := 0; i+(2-1) &lt; len(b); i += 2 {
utf[i/2] = o.Uint16(b[i:])
}
if len(b)/2 &lt; len(utf) {
utf[len(utf)-1] = utf8.RuneError
}
return string(utf16.Decode(utf))
}

Knowing our byte order and passing it in, this will convert the naïve byte array to a string of UTF-16 characters. Thanks to user OneOfOne's comment, we can also detect the BOM easily.

The result:

package main
import (
&quot;encoding/binary&quot;
&quot;encoding/json&quot;
&quot;fmt&quot;
&quot;io/ioutil&quot;
&quot;net/http&quot;
&quot;unicode/utf16&quot;
&quot;unicode/utf8&quot;
)
const alertsUrl = &quot;http://www.oref.org.il/WarningMessages/alerts.json&quot;
type Record struct {
Id    string   `json:id`
Title string   `json:title`
Data  []string `json:data`
}
// LazyUTF16BytesToString converts UTF-16 encoded bytes, in big or little endian byte order,
// to a UTF-8 encoded string.
func LazyUTF16BytesToString(b []byte) string {
if len(b)%2 != 0 {
panic(&quot;len(b) % 2 != 0&quot;)
}
var codec binary.ByteOrder = binary.LittleEndian
if b[0] == 0xFE &amp;&amp; b[1] == 0xFF { //check and strip the BOM
b = b[2:]
codec = binary.BigEndian
} else if b[0] == 0xFF &amp;&amp; b[1] == 0xFE {
b = b[2:]
}
utf := make([]uint16, (len(b)+(2-1))/2)
for i := 0; i+(2-1) &lt; len(b); i += 2 {
utf[i/2] = codec.Uint16(b[i:])
}
if len(b)/2 &lt; len(utf) {
utf[len(utf)-1] = utf8.RuneError
}
return string(utf16.Decode(utf))
}
func main() {
client := &amp;http.Client{}
req, err := http.NewRequest(&quot;GET&quot;, alertsUrl, nil)
perror(err)
req.Header.Add(&quot;Content-Type&quot;, &quot;application/json; charset=utf-8&quot;)
res, err := client.Do(req)
perror(err)
defer res.Body.Close()
body, err := ioutil.ReadAll(res.Body)
perror(err)
bodyString := LazyUTF16BytesToString(body)
var record Record
err = json.Unmarshal([]byte(bodyString), &amp;record)
perror(err)
fmt.Println(record)
}
func perror(err error) {
if err != nil {
panic(err)
}
}

huangapple
  • 本文由 发表于 2014年7月11日 00:21:08
  • 转载请务必保留本文链接:https://go.coder-hub.com/24681644.html
匿名

发表评论

匿名网友

:?: :razz: :sad: :evil: :!: :smile: :oops: :grin: :eek: :shock: :???: :cool: :lol: :mad: :twisted: :roll: :wink: :idea: :arrow: :neutral: :cry: :mrgreen:

确定