使用切片值进行 Golang 字符串格式化

huangapple go评论106阅读模式

Golang string format using slice values





  1. import (
  2. "fmt"
  3. "strings"
  4. )
  // main builds the query string for a fixed pair of node names and prints it.
  // Expected output: where={"node_name":"node1","node_name":"node2"}
  func main() {
  	nodes := []string{"node1", "node2"}
  	var query string
  	for _, n := range nodes {
  		// Append one `"node_name":"<n>",` fragment per node.
  		query += fmt.Sprintf("\"node_name\":\"%s\",", n)
  	}
  	// Remove the comma left behind by the last fragment.
  	query = strings.TrimRight(query, ",")
  	final := fmt.Sprintf("where={%s}", query)
  	fmt.Println(final)
  }

这是 goplayground 的链接。



Here I am trying to create a query string for my API from a slice containing strings.

i.e. where={"node_name":"node1","node_name":"node2"}

  1. import (
  2. "fmt"
  3. "strings"
  4. )
  // main builds the query string for a fixed pair of node names and prints it.
  // Expected output: where={"node_name":"node1","node_name":"node2"}
  func main() {
  	nodes := []string{"node1", "node2"}
  	var query string
  	for _, n := range nodes {
  		// Append one `"node_name":"<n>",` fragment per node.
  		query += fmt.Sprintf("\"node_name\":\"%s\",", n)
  	}
  	// Remove the comma left behind by the last fragment.
  	query = strings.TrimRight(query, ",")
  	final := fmt.Sprintf("where={%s}", query)
  	fmt.Println(final)
  }

Here is goplayground link.

What is the best way to get the result?


得分: 16



完整可运行的代码可以在Go Playground上找到。完整的测试/基准测试代码也可以在Go Playground上找到,但无法在那里运行;请将这两个文件保存到你的Go工作区(例如 $GOPATH/src/query/query.go 和 $GOPATH/src/query/query_test.go),然后使用 go test -bench . 运行。





  // buildOriginal reproduces the question's approach and serves as the
  // benchmark baseline: it formats one fragment per node with fmt.Sprintf,
  // appends it to a growing string, trims the trailing comma and wraps the
  // result in "where={...}". An empty or nil slice yields "where={}".
  //
  // Node values are inserted verbatim; a double quote inside a value is not
  // escaped.
  func buildOriginal(nodes []string) string {
  	var query string
  	for _, n := range nodes {
  		// Repeated string concatenation is kept on purpose: this is the
  		// implementation the faster variants are measured against.
  		query += fmt.Sprintf("\"node_name\":\"%s\",", n)
  	}
  	// Remove the comma left behind by the last fragment.
  	query = strings.TrimRight(query, ",")
  	return fmt.Sprintf("where={%s}", query)
  }



  // buildBuffer assembles the query in a single bytes.Buffer and converts it to
  // a string once at the end. An empty or nil slice yields "where={}".
  //
  // Node values are written verbatim; a double quote inside a value is not
  // escaped.
  func buildBuffer(nodes []string) string {
  	buf := &bytes.Buffer{}
  	buf.WriteString("where={")
  	for i, v := range nodes {
  		// Separate entries with a comma; none before the first one.
  		if i > 0 {
  			buf.WriteByte(',')
  		}
  		buf.WriteString("\"node_name\":\"")
  		buf.WriteString(v)
  		buf.WriteByte('"')
  	}
  	buf.WriteByte('}')
  	return buf.String()
  }


  1. nodes := []string{"node1", "node2"}
  2. fmt.Println(buildBuffer(nodes))


  1. where={"node_name":"node1","node_name":"node2"}




  // buildBuffer2 is buildBuffer with a pre-sized backing slice, so the buffer
  // does not have to grow while the query is written. An empty or nil slice
  // yields "where={}".
  //
  // Node values are written verbatim; a double quote inside a value is not
  // escaped.
  func buildBuffer2(nodes []string) string {
  	// 8 is len(`where={}`); 15 is len(`"node_name":"",`), the fixed text
  	// written per node including its separating comma.
  	size := 8 + len(nodes)*15
  	for _, v := range nodes {
  		size += len(v)
  	}
  	buf := bytes.NewBuffer(make([]byte, 0, size))
  	buf.WriteString("where={")
  	for i, v := range nodes {
  		// Separate entries with a comma; none before the first one.
  		if i > 0 {
  			buf.WriteByte(',')
  		}
  		buf.WriteString("\"node_name\":\"")
  		buf.WriteString(v)
  		buf.WriteByte('"')
  	}
  	buf.WriteByte('}')
  	return buf.String()
  }




  // t is the parsed query template; it is parsed once at package
  // initialization and template.Must panics if templ is malformed.
  var t = template.Must(template.New("").Parse(templ))

  // buildTemplate renders the query by executing t with nodes as its data,
  // writing into a buffer pre-sized with the same estimate buildBuffer2 uses.
  // An empty or nil slice yields "where={}".
  //
  // Node values are emitted verbatim by text/template; a double quote inside a
  // value is not escaped.
  func buildTemplate(nodes []string) string {
  	// 8 is len(`where={}`); 15 is len(`"node_name":"",`).
  	size := 8 + len(nodes)*15
  	for _, v := range nodes {
  		size += len(v)
  	}
  	buf := bytes.NewBuffer(make([]byte, 0, size))
  	if err := t.Execute(buf, nodes); err != nil {
  		log.Fatal(err) // Handle error
  	}
  	return buf.String()
  }

  // templ is the query template. The "{{-" and "-}}" trim markers strip the
  // surrounding line breaks and indentation, so the rendered text is one line.
  const templ = `where={
  {{- range $idx, $n := . -}}
  {{if ne $idx 0}},{{end}}"node_name":"{{$n}}"
  {{- end -}}
  }`




  // buildJoin builds the query with strings.Join: the nodes are joined with the
  // static text `","node_name":"` and the result is wrapped in the matching
  // prefix and suffix.
  //
  // Node values are inserted verbatim; a double quote inside a value is not
  // escaped.
  func buildJoin(nodes []string) string {
  	// Without this guard an empty slice would render one empty entry:
  	// where={"node_name":""}.
  	if len(nodes) == 0 {
  		return "where={}"
  	}
  	return `where={"node_name":"` + strings.Join(nodes, `","node_name":"`) + `"}`
  }



  // nodes is the benchmark input: the same four names of different lengths,
  // repeated five times (20 entries in total).
  var nodes = []string{"n1", "node2", "nodethree", "fourthNode",
  	"n1", "node2", "nodethree", "fourthNode",
  	"n1", "node2", "nodethree", "fourthNode",
  	"n1", "node2", "nodethree", "fourthNode",
  	"n1", "node2", "nodethree", "fourthNode",
  }


  1. func BenchmarkOriginal(b *testing.B) {
  2. for i := 0; i < b.N; i++ {
  3. buildOriginal(nodes)
  4. }
  5. }
  6. func BenchmarkBuffer(b *testing.B) {
  7. for i := 0; i < b.N; i++ {
  8. buildBuffer(nodes)
  9. }
  10. }
  11. // ... 其他所有基准测试函数都相同


  1. BenchmarkOriginal-4 200000 10572 ns/op
  2. BenchmarkBuffer-4 500000 2914 ns/op
  3. BenchmarkBuffer2-4 1000000 2024 ns/op
  4. BenchmarkBufferTemplate-4 30000 77634 ns/op
  5. BenchmarkJoin-4 2000000 830 ns/op




Your solution uses way too many allocations due to string concatenations.

We'll create some alternative, faster and/or more elegant solutions. Note that the solutions below do not check whether node values contain the quotation mark (") character. If they did, those characters would have to be escaped somehow (otherwise the result would be an invalid query string).

The complete, runnable code can be found on the Go Playground. The complete testing / benchmarking code can also be found on the Go Playground, but it is not runnable there; save both files to your Go workspace (e.g. $GOPATH/src/query/query.go and $GOPATH/src/query/query_test.go) and run the benchmarks with the command go test -bench . (the trailing dot is part of the command).

Also be sure to check out this related question: https://stackoverflow.com/questions/1760757/how-to-efficiently-concatenate-strings-in-go



Your logic can be captured by the following function:

  // buildOriginal reproduces the question's approach and serves as the
  // benchmark baseline: it formats one fragment per node with fmt.Sprintf,
  // appends it to a growing string, trims the trailing comma and wraps the
  // result in "where={...}". An empty or nil slice yields "where={}".
  //
  // Node values are inserted verbatim; a double quote inside a value is not
  // escaped.
  func buildOriginal(nodes []string) string {
  	var query string
  	for _, n := range nodes {
  		// Repeated string concatenation is kept on purpose: this is the
  		// implementation the faster variants are measured against.
  		query += fmt.Sprintf("\"node_name\":\"%s\",", n)
  	}
  	// Remove the comma left behind by the last fragment.
  	query = strings.TrimRight(query, ",")
  	return fmt.Sprintf("where={%s}", query)
  }

Using bytes.Buffer

Much better would be to use a single buffer, e.g. bytes.Buffer, build the query in that, and convert it to string at the end:

  // buildBuffer assembles the query in a single bytes.Buffer and converts it to
  // a string once at the end. An empty or nil slice yields "where={}".
  //
  // Node values are written verbatim; a double quote inside a value is not
  // escaped.
  func buildBuffer(nodes []string) string {
  	buf := &bytes.Buffer{}
  	buf.WriteString("where={")
  	for i, v := range nodes {
  		// Separate entries with a comma; none before the first one.
  		if i > 0 {
  			buf.WriteByte(',')
  		}
  		buf.WriteString(`"node_name":"`)
  		buf.WriteString(v)
  		buf.WriteByte('"')
  	}
  	buf.WriteByte('}')
  	return buf.String()
  }

Using it:

  1. nodes := []string{"node1", "node2"}
  2. fmt.Println(buildBuffer(nodes))


  1. where={"node_name":"node1","node_name":"node2"}

bytes.Buffer improved

bytes.Buffer will still do some reallocations, although much less than your original solution.

However, we can still reduce the allocations to 1, if we pass a big-enough byte slice when creating the bytes.Buffer using bytes.NewBuffer(). We can calculate the required size prior:

  // buildBuffer2 is buildBuffer with a pre-sized backing slice, so the buffer
  // does not have to grow while the query is written. An empty or nil slice
  // yields "where={}".
  //
  // Node values are written verbatim; a double quote inside a value is not
  // escaped.
  func buildBuffer2(nodes []string) string {
  	// 8 is len(`where={}`); 15 is len(`"node_name":"",`), the fixed text
  	// written per node including its separating comma.
  	size := 8 + len(nodes)*15
  	for _, v := range nodes {
  		size += len(v)
  	}
  	buf := bytes.NewBuffer(make([]byte, 0, size))
  	buf.WriteString("where={")
  	for i, v := range nodes {
  		// Separate entries with a comma; none before the first one.
  		if i > 0 {
  			buf.WriteByte(',')
  		}
  		buf.WriteString(`"node_name":"`)
  		buf.WriteString(v)
  		buf.WriteByte('"')
  	}
  	buf.WriteByte('}')
  	return buf.String()
  }

Note that in the size calculation, 8 is the length of the string where={} and 15 is the length of the string "node_name":"", (the fixed text written per node, including its separating comma).

Using text/template

We can also create a text template, and use the text/template package to execute it, efficiently generating the result:

  // t is the parsed query template; it is parsed once at package
  // initialization and template.Must panics if templ is malformed.
  var t = template.Must(template.New("").Parse(templ))

  // buildTemplate renders the query by executing t with nodes as its data,
  // writing into a buffer pre-sized with the same estimate buildBuffer2 uses.
  // An empty or nil slice yields "where={}".
  //
  // Node values are emitted verbatim by text/template; a double quote inside a
  // value is not escaped.
  func buildTemplate(nodes []string) string {
  	// 8 is len(`where={}`); 15 is len(`"node_name":"",`).
  	size := 8 + len(nodes)*15
  	for _, v := range nodes {
  		size += len(v)
  	}
  	buf := bytes.NewBuffer(make([]byte, 0, size))
  	if err := t.Execute(buf, nodes); err != nil {
  		log.Fatal(err) // Handle error
  	}
  	return buf.String()
  }

  // templ is the query template. The "{{-" and "-}}" trim markers strip the
  // surrounding line breaks and indentation, so the rendered text is one line.
  const templ = `where={
  {{- range $idx, $n := . -}}
  {{if ne $idx 0}},{{end}}"node_name":"{{$n}}"
  {{- end -}}
  }`

Using strings.Join()

This solution is interesting due to its simplicity. We can use strings.Join() to join the nodes with the static text ","node_name":" in between, with the proper prefix and postfix applied.

An important thing to note: strings.Join() uses the builtin copy() function with a single preallocated []byte buffer, so it's very fast! "As a special case, it (the copy() function) also will copy bytes from a string to a slice of bytes."

  // buildJoin builds the query with strings.Join: the nodes are joined with the
  // static text `","node_name":"` and the result is wrapped in the matching
  // prefix and suffix.
  //
  // Node values are inserted verbatim; a double quote inside a value is not
  // escaped.
  func buildJoin(nodes []string) string {
  	// Without this guard an empty slice would render one empty entry:
  	// where={"node_name":""}.
  	if len(nodes) == 0 {
  		return "where={}"
  	}
  	return `where={"node_name":"` + strings.Join(nodes, `","node_name":"`) + `"}`
  }

Benchmark results

We'll benchmark with the following nodes value:

  // nodes is the benchmark input: the same four names of different lengths,
  // repeated five times (20 entries in total).
  var nodes = []string{"n1", "node2", "nodethree", "fourthNode",
  	"n1", "node2", "nodethree", "fourthNode",
  	"n1", "node2", "nodethree", "fourthNode",
  	"n1", "node2", "nodethree", "fourthNode",
  	"n1", "node2", "nodethree", "fourthNode",
  }

And the benchmarking code looks like this:

  1. func BenchmarkOriginal(b *testing.B) {
  2. for i := 0; i &lt; b.N; i++ {
  3. buildOriginal(nodes)
  4. }
  5. }
  6. func BenchmarkBuffer(b *testing.B) {
  7. for i := 0; i &lt; b.N; i++ {
  8. buildBuffer(nodes)
  9. }
  10. }
  11. // ... All the other benchmarking functions look the same

And now the results:

  1. BenchmarkOriginal-4 200000 10572 ns/op
  2. BenchmarkBuffer-4 500000 2914 ns/op
  3. BenchmarkBuffer2-4 1000000 2024 ns/op
  4. BenchmarkBufferTemplate-4 30000 77634 ns/op
  5. BenchmarkJoin-4 2000000 830 ns/op

Some unsurprising facts: buildBuffer() is 3.6 times faster than buildOriginal(), and buildBuffer2() (with pre-calculated size) is about 30% faster than buildBuffer() because it does not need to reallocate (and copy over) the internal buffer.

Some surprising facts: buildJoin() is extremely fast, even beating buildBuffer2() by a factor of 2.4 (because it only uses a []byte and copy()). buildTemplate(), on the other hand, proved quite slow: 7 times slower than buildOriginal(). The main reason is that it uses (has to use) reflection under the hood.

  • 本文由 发表于 2017年1月4日 14:12:03
  • 转载请务必保留本文链接:https://go.coder-hub.com/41457273.html



:?: :razz: :sad: :evil: :!: :smile: :oops: :grin: :eek: :shock: :???: :cool: :lol: :mad: :twisted: :roll: :wink: :idea: :arrow: :neutral: :cry: :mrgreen:
