agent.go 3.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116
  1. package trace
  2. import (
  3. "context"
  4. "fmt"
  5. "sync"
  6. "github.com/zeromicro/go-zero/core/lang"
  7. "github.com/zeromicro/go-zero/core/logx"
  8. "go.opentelemetry.io/otel"
  9. "go.opentelemetry.io/otel/exporters/jaeger"
  10. "go.opentelemetry.io/otel/exporters/otlp/otlptrace/otlptracegrpc"
  11. "go.opentelemetry.io/otel/exporters/otlp/otlptrace/otlptracehttp"
  12. "go.opentelemetry.io/otel/exporters/zipkin"
  13. "go.opentelemetry.io/otel/sdk/resource"
  14. sdktrace "go.opentelemetry.io/otel/sdk/trace"
  15. semconv "go.opentelemetry.io/otel/semconv/v1.4.0"
  16. )
  // Exporter kinds that createExporter recognizes in Config.Batcher.
  const (
  	// kindJaeger exports to a Jaeger collector endpoint.
  	kindJaeger = "jaeger"
  	// kindJaegerUdp exports to a Jaeger agent addressed by host and port.
  	kindJaegerUdp = "jaegerudp"
  	// kindZipkin exports to a Zipkin endpoint.
  	kindZipkin = "zipkin"
  	// kindOtlpGrpc exports via OTLP over gRPC.
  	kindOtlpGrpc = "otlpgrpc"
  	// kindOtlpHttp exports via OTLP over HTTP.
  	kindOtlpHttp = "otlphttp"
  )
  24. var (
  25. agents = make(map[string]lang.PlaceholderType)
  26. lock sync.Mutex
  27. tp *sdktrace.TracerProvider
  28. )
  29. // StartAgent starts an opentelemetry agent.
  30. func StartAgent(c Config) {
  31. lock.Lock()
  32. defer lock.Unlock()
  33. _, ok := agents[c.Endpoint]
  34. if ok {
  35. return
  36. }
  37. // if error happens, let later calls run.
  38. if err := startAgent(c); err != nil {
  39. return
  40. }
  41. agents[c.Endpoint] = lang.Placeholder
  42. }
  43. // StopAgent shuts down the span processors in the order they were registered.
  44. func StopAgent() {
  45. _ = tp.Shutdown(context.Background())
  46. }
  47. func createExporter(c Config) (sdktrace.SpanExporter, error) {
  48. // Just support jaeger and zipkin now, more for later
  49. switch c.Batcher {
  50. case kindJaeger:
  51. return jaeger.New(jaeger.WithCollectorEndpoint(jaeger.WithEndpoint(c.Endpoint)))
  52. case kindJaegerUdp:
  53. host, port := c.parseEndpoint()
  54. return jaeger.New(jaeger.WithAgentEndpoint(jaeger.WithAgentHost(host), jaeger.WithAgentPort(port)))
  55. case kindZipkin:
  56. return zipkin.New(c.Endpoint)
  57. case kindOtlpGrpc:
  58. // Always treat trace exporter as optional component, so we use nonblock here,
  59. // otherwise this would slow down app start up even set a dial timeout here when
  60. // endpoint can not reach.
  61. // If the connection not dial success, the global otel ErrorHandler will catch error
  62. // when reporting data like other exporters.
  63. return otlptracegrpc.New(
  64. context.Background(),
  65. otlptracegrpc.WithInsecure(),
  66. otlptracegrpc.WithEndpoint(c.Endpoint),
  67. )
  68. case kindOtlpHttp:
  69. // Not support flexible configuration now.
  70. return otlptracehttp.New(
  71. context.Background(),
  72. otlptracehttp.WithInsecure(),
  73. otlptracehttp.WithEndpoint(c.Endpoint),
  74. )
  75. default:
  76. return nil, fmt.Errorf("unknown exporter: %s", c.Batcher)
  77. }
  78. }
  79. func startAgent(c Config) error {
  80. opts := []sdktrace.TracerProviderOption{
  81. // Set the sampling rate based on the parent span to 100%
  82. sdktrace.WithSampler(sdktrace.ParentBased(sdktrace.TraceIDRatioBased(c.Sampler))),
  83. // Record information about this application in a Resource.
  84. sdktrace.WithResource(resource.NewSchemaless(semconv.ServiceNameKey.String(c.Name))),
  85. }
  86. if len(c.Endpoint) > 0 {
  87. exp, err := createExporter(c)
  88. if err != nil {
  89. logx.Error(err)
  90. return err
  91. }
  92. // Always be sure to batch in production.
  93. opts = append(opts, sdktrace.WithBatcher(exp))
  94. }
  95. tp = sdktrace.NewTracerProvider(opts...)
  96. otel.SetTracerProvider(tp)
  97. otel.SetErrorHandler(otel.ErrorHandlerFunc(func(err error) {
  98. logx.Errorf("[otel] error: %v", err)
  99. }))
  100. return nil
  101. }