1
0

datadog.go 5.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244
  1. package datadog
  2. import (
  3. "context"
  4. "fmt"
  5. "log/slog"
  6. "net"
  7. "net/http"
  8. "os"
  9. "reflect"
  10. "strconv"
  11. "sync"
  12. "time"
  13. "github.com/DataDog/datadog-go/v5/statsd"
  14. "github.com/DataDog/dd-trace-go/v2/ddtrace/ext"
  15. "github.com/DataDog/dd-trace-go/v2/ddtrace/tracer"
  16. "github.com/felixge/httpsnoop"
  17. "github.com/imgproxy/imgproxy/v3/config"
  18. "github.com/imgproxy/imgproxy/v3/monitoring/errformat"
  19. "github.com/imgproxy/imgproxy/v3/monitoring/stats"
  20. "github.com/imgproxy/imgproxy/v3/version"
  21. )
  type (
  	// spanCtxKey is the context key under which StartRootSpan stores the
  	// request's root span. Being an unexported empty struct, it cannot be
  	// produced by code outside this package.
  	spanCtxKey struct{}

  	// GaugeFunc returns the current value of a gauge. Functions registered
  	// through AddGaugeFunc are invoked by the metrics collector on every tick.
  	GaugeFunc func() float64
  )
  24. var (
  25. enabled bool
  26. enabledMetrics bool
  27. statsdClient *statsd.Client
  28. statsdClientStop chan struct{}
  29. gaugeFuncs = make(map[string]GaugeFunc)
  30. gaugeFuncsMutex sync.RWMutex
  31. )
  32. func Init() {
  33. if !config.DataDogEnable {
  34. return
  35. }
  36. name := os.Getenv("DD_SERVICE")
  37. if len(name) == 0 {
  38. name = "imgproxy"
  39. }
  40. logStartup := false
  41. if b, err := strconv.ParseBool(os.Getenv("DD_TRACE_STARTUP_LOGS")); err == nil {
  42. logStartup = b
  43. }
  44. tracer.Start(
  45. tracer.WithService(name),
  46. tracer.WithServiceVersion(version.Version),
  47. tracer.WithLogger(dataDogLogger{}),
  48. tracer.WithLogStartup(logStartup),
  49. )
  50. enabled = true
  51. statsdHost, statsdPort := os.Getenv("DD_AGENT_HOST"), os.Getenv("DD_DOGSTATSD_PORT")
  52. if len(statsdHost) == 0 {
  53. statsdHost = "localhost"
  54. }
  55. if len(statsdPort) == 0 {
  56. statsdPort = "8125"
  57. }
  58. if !config.DataDogEnableMetrics {
  59. return
  60. }
  61. var err error
  62. statsdClient, err = statsd.New(
  63. net.JoinHostPort(statsdHost, statsdPort),
  64. statsd.WithTags([]string{
  65. "service:" + name,
  66. "version:" + version.Version,
  67. }),
  68. )
  69. if err == nil {
  70. statsdClientStop = make(chan struct{})
  71. enabledMetrics = true
  72. go runMetricsCollector()
  73. } else {
  74. slog.Warn(fmt.Sprintf("Can't initialize DogStatsD client: %s", err))
  75. }
  76. }
  77. func Stop() {
  78. if enabled {
  79. tracer.Stop()
  80. if statsdClient != nil {
  81. close(statsdClientStop)
  82. statsdClient.Close()
  83. }
  84. }
  85. }
  86. func Enabled() bool {
  87. return enabled
  88. }
  89. func StartRootSpan(ctx context.Context, rw http.ResponseWriter, r *http.Request) (context.Context, context.CancelFunc, http.ResponseWriter) {
  90. if !enabled {
  91. return ctx, func() {}, rw
  92. }
  93. span := tracer.StartSpan(
  94. "request",
  95. tracer.Measured(),
  96. tracer.SpanType("web"),
  97. tracer.Tag(ext.HTTPMethod, r.Method),
  98. tracer.Tag(ext.HTTPURL, r.RequestURI),
  99. )
  100. cancel := func() { span.Finish() }
  101. newRw := httpsnoop.Wrap(rw, httpsnoop.Hooks{
  102. WriteHeader: func(next httpsnoop.WriteHeaderFunc) httpsnoop.WriteHeaderFunc {
  103. return func(statusCode int) {
  104. span.SetTag(ext.HTTPCode, statusCode)
  105. next(statusCode)
  106. }
  107. },
  108. })
  109. return context.WithValue(ctx, spanCtxKey{}, span), cancel, newRw
  110. }
  111. func setMetadata(span *tracer.Span, key string, value any) {
  112. if len(key) == 0 || value == nil {
  113. return
  114. }
  115. if rv := reflect.ValueOf(value); rv.Kind() == reflect.Map && rv.Type().Key().Kind() == reflect.String {
  116. for _, k := range rv.MapKeys() {
  117. setMetadata(span, key+"."+k.String(), rv.MapIndex(k).Interface())
  118. }
  119. return
  120. }
  121. span.SetTag(key, value)
  122. }
  123. func SetMetadata(ctx context.Context, key string, value any) {
  124. if !enabled {
  125. return
  126. }
  127. if rootSpan, ok := ctx.Value(spanCtxKey{}).(*tracer.Span); ok {
  128. setMetadata(rootSpan, key, value)
  129. }
  130. }
  131. func StartSpan(ctx context.Context, name string, meta map[string]any) context.CancelFunc {
  132. if !enabled {
  133. return func() {}
  134. }
  135. if rootSpan, ok := ctx.Value(spanCtxKey{}).(*tracer.Span); ok {
  136. span := rootSpan.StartChild(name, tracer.Measured())
  137. for k, v := range meta {
  138. setMetadata(span, k, v)
  139. }
  140. return func() { span.Finish() }
  141. }
  142. return func() {}
  143. }
  144. func SendError(ctx context.Context, errType string, err error) {
  145. if !enabled {
  146. return
  147. }
  148. if rootSpan, ok := ctx.Value(spanCtxKey{}).(*tracer.Span); ok {
  149. rootSpan.SetTag(ext.Error, err)
  150. rootSpan.SetTag(ext.ErrorType, errformat.FormatErrType(errType, err))
  151. }
  152. }
  153. func AddGaugeFunc(name string, f GaugeFunc) {
  154. gaugeFuncsMutex.Lock()
  155. defer gaugeFuncsMutex.Unlock()
  156. gaugeFuncs["imgproxy."+name] = f
  157. }
  158. func ObserveBufferSize(t string, size int) {
  159. if enabledMetrics {
  160. statsdClient.Histogram("imgproxy.buffer.size", float64(size), []string{"type:" + t}, 1)
  161. }
  162. }
  163. func SetBufferDefaultSize(t string, size int) {
  164. if enabledMetrics {
  165. statsdClient.Gauge("imgproxy.buffer.default_size", float64(size), []string{"type:" + t}, 1)
  166. }
  167. }
  168. func SetBufferMaxSize(t string, size int) {
  169. if enabledMetrics {
  170. statsdClient.Gauge("imgproxy.buffer.max_size", float64(size), []string{"type:" + t}, 1)
  171. }
  172. }
  173. func runMetricsCollector() {
  174. tick := time.NewTicker(10 * time.Second)
  175. defer tick.Stop()
  176. for {
  177. select {
  178. case <-tick.C:
  179. func() {
  180. gaugeFuncsMutex.RLock()
  181. defer gaugeFuncsMutex.RUnlock()
  182. for name, f := range gaugeFuncs {
  183. statsdClient.Gauge(name, f(), nil, 1)
  184. }
  185. }()
  186. statsdClient.Gauge("imgproxy.workers", float64(config.Workers), nil, 1)
  187. statsdClient.Gauge("imgproxy.requests_in_progress", stats.RequestsInProgress(), nil, 1)
  188. statsdClient.Gauge("imgproxy.images_in_progress", stats.ImagesInProgress(), nil, 1)
  189. statsdClient.Gauge("imgproxy.workers_utilization", stats.WorkersUtilization(), nil, 1)
  190. case <-statsdClientStop:
  191. return
  192. }
  193. }
  194. }
  // dataDogLogger is the logger handed to the tracer in Init; it forwards the
  // tracer's messages to the default slog logger.
  type dataDogLogger struct{}

  // Log writes msg at info level through the default slog logger.
  func (dataDogLogger) Log(msg string) {
  	slog.Info(msg)
  }