labelImage.go 4.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184
  1. // Copyright 2021 EMQ Technologies Co., Ltd.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. // +build tflite
  15. package main
  16. import (
  17. "bufio"
  18. "bytes"
  19. "fmt"
  20. "github.com/lf-edge/ekuiper/pkg/api"
  21. tflite "github.com/mattn/go-tflite"
  22. "github.com/nfnt/resize"
  23. "image"
  24. _ "image/jpeg"
  25. _ "image/png"
  26. "os"
  27. "path"
  28. "sort"
  29. "sync"
  30. )
  31. type labelImage struct {
  32. modelPath string
  33. labelPath string
  34. once sync.Once
  35. interpreter *tflite.Interpreter
  36. labels []string
  37. }
  38. func (f *labelImage) Validate(args []interface{}) error {
  39. if len(args) != 1 {
  40. return fmt.Errorf("labelImage function only supports 1 parameter but got %d", len(args))
  41. }
  42. return nil
  43. }
  44. func (f *labelImage) Exec(args []interface{}, ctx api.FunctionContext) (interface{}, bool) {
  45. arg0, ok := args[0].([]byte)
  46. if !ok {
  47. return fmt.Errorf("labelImage function parameter must be a bytea, but got %[1]T(%[1]v)", args[0]), false
  48. }
  49. img, _, err := image.Decode(bytes.NewReader(arg0))
  50. if err != nil {
  51. return err, false
  52. }
  53. var outerErr error
  54. f.once.Do(func() {
  55. ploc := path.Join(ctx.GetRootPath(), "etc", "functions")
  56. f.labels, err = loadLabels(path.Join(ploc, f.labelPath))
  57. if err != nil {
  58. outerErr = fmt.Errorf("fail to load labels: %s", err)
  59. return
  60. }
  61. model := tflite.NewModelFromFile(path.Join(ploc, f.modelPath))
  62. if model == nil {
  63. outerErr = fmt.Errorf("fail to load model: %s", err)
  64. return
  65. }
  66. defer model.Delete()
  67. options := tflite.NewInterpreterOptions()
  68. options.SetNumThread(4)
  69. options.SetErrorReporter(func(msg string, user_data interface{}) {
  70. fmt.Println(msg)
  71. }, nil)
  72. defer options.Delete()
  73. interpreter := tflite.NewInterpreter(model, options)
  74. if interpreter == nil {
  75. outerErr = fmt.Errorf("cannot create interpreter")
  76. return
  77. }
  78. status := interpreter.AllocateTensors()
  79. if status != tflite.OK {
  80. outerErr = fmt.Errorf("allocate failed")
  81. interpreter.Delete()
  82. return
  83. }
  84. f.interpreter = interpreter
  85. // TODO If created, the interpreter will be kept through the whole life of kuiper. Refactor this later.
  86. //defer interpreter.Delete()
  87. })
  88. if f.interpreter == nil {
  89. return fmt.Errorf("fail to load model %s %s", f.modelPath, outerErr), false
  90. }
  91. input := f.interpreter.GetInputTensor(0)
  92. wantedHeight := input.Dim(1)
  93. wantedWidth := input.Dim(2)
  94. wantedChannels := input.Dim(3)
  95. wantedType := input.Type()
  96. resized := resize.Resize(uint(wantedWidth), uint(wantedHeight), img, resize.NearestNeighbor)
  97. bounds := resized.Bounds()
  98. dx, dy := bounds.Dx(), bounds.Dy()
  99. if wantedType == tflite.UInt8 {
  100. bb := make([]byte, dx*dy*wantedChannels)
  101. for y := 0; y < dy; y++ {
  102. for x := 0; x < dx; x++ {
  103. col := resized.At(x, y)
  104. r, g, b, _ := col.RGBA()
  105. bb[(y*dx+x)*3+0] = byte(float64(r) / 255.0)
  106. bb[(y*dx+x)*3+1] = byte(float64(g) / 255.0)
  107. bb[(y*dx+x)*3+2] = byte(float64(b) / 255.0)
  108. }
  109. }
  110. input.CopyFromBuffer(bb)
  111. } else {
  112. return fmt.Errorf("is not wanted type"), false
  113. }
  114. status := f.interpreter.Invoke()
  115. if status != tflite.OK {
  116. return fmt.Errorf("invoke failed"), false
  117. }
  118. output := f.interpreter.GetOutputTensor(0)
  119. outputSize := output.Dim(output.NumDims() - 1)
  120. b := make([]byte, outputSize)
  121. type result struct {
  122. score float64
  123. index int
  124. }
  125. status = output.CopyToBuffer(&b[0])
  126. if status != tflite.OK {
  127. return fmt.Errorf("output failed"), false
  128. }
  129. var results []result
  130. for i := 0; i < outputSize; i++ {
  131. score := float64(b[i]) / 255.0
  132. if score < 0.2 {
  133. continue
  134. }
  135. results = append(results, result{score: score, index: i})
  136. }
  137. sort.Slice(results, func(i, j int) bool {
  138. return results[i].score > results[j].score
  139. })
  140. // output is the biggest score labelImage
  141. if len(results) > 0 {
  142. return f.labels[results[0].index], true
  143. } else {
  144. return "", true
  145. }
  146. }
  147. func (f *labelImage) IsAggregate() bool {
  148. return false
  149. }
  150. func loadLabels(filename string) ([]string, error) {
  151. labels := []string{}
  152. f, err := os.Open(filename)
  153. if err != nil {
  154. return nil, err
  155. }
  156. defer f.Close()
  157. scanner := bufio.NewScanner(f)
  158. for scanner.Scan() {
  159. labels = append(labels, scanner.Text())
  160. }
  161. return labels, nil
  162. }
  163. var LabelImage = labelImage{
  164. modelPath: "labelImage/mobilenet_quant_v1_224.tflite",
  165. labelPath: "labelImage/labels.txt",
  166. }