agent.go 2.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112
  1. package trace
  2. import (
  3. "context"
  4. "fmt"
  5. "sync"
  6. "github.com/zeromicro/go-zero/core/lang"
  7. "github.com/zeromicro/go-zero/core/logx"
  8. "go.opentelemetry.io/otel"
  9. "go.opentelemetry.io/otel/exporters/jaeger"
  10. "go.opentelemetry.io/otel/exporters/otlp/otlptrace/otlptracegrpc"
  11. "go.opentelemetry.io/otel/exporters/otlp/otlptrace/otlptracehttp"
  12. "go.opentelemetry.io/otel/exporters/zipkin"
  13. "go.opentelemetry.io/otel/sdk/resource"
  14. sdktrace "go.opentelemetry.io/otel/sdk/trace"
  15. semconv "go.opentelemetry.io/otel/semconv/v1.4.0"
  16. )
// Exporter kinds recognised by createExporter; each value is compared against
// Config.Batcher to pick the span exporter implementation.
const (
	// kindJaeger selects the Jaeger collector exporter.
	kindJaeger = "jaeger"
	// kindZipkin selects the Zipkin exporter.
	kindZipkin = "zipkin"
	// kindOtlpGrpc selects the OTLP trace exporter over gRPC.
	kindOtlpGrpc = "otlpgrpc"
	// kindOtlpHttp selects the OTLP trace exporter over HTTP.
	kindOtlpHttp = "otlphttp"
)
var (
	// agents is the set of endpoints for which StartAgent has already
	// started an agent successfully; it is keyed by Config.Endpoint.
	agents = make(map[string]lang.PlaceholderType)
	// lock serializes StartAgent calls, protecting agents and the
	// assignment of tp performed during startup.
	lock sync.Mutex
	// tp is the most recently created tracer provider; it stays nil until
	// startAgent has completed successfully at least once.
	tp *sdktrace.TracerProvider
)
  28. // StartAgent starts an opentelemetry agent.
  29. func StartAgent(c Config) {
  30. lock.Lock()
  31. defer lock.Unlock()
  32. _, ok := agents[c.Endpoint]
  33. if ok {
  34. return
  35. }
  36. // if error happens, let later calls run.
  37. if err := startAgent(c); err != nil {
  38. return
  39. }
  40. agents[c.Endpoint] = lang.Placeholder
  41. }
  42. // StopAgent shuts down the span processors in the order they were registered.
  43. func StopAgent() {
  44. _ = tp.Shutdown(context.Background())
  45. }
  46. func createExporter(c Config) (sdktrace.SpanExporter, error) {
  47. // Just support jaeger and zipkin now, more for later
  48. switch c.Batcher {
  49. case kindJaeger:
  50. return jaeger.New(jaeger.WithCollectorEndpoint(jaeger.WithEndpoint(c.Endpoint)))
  51. case kindZipkin:
  52. return zipkin.New(c.Endpoint)
  53. case kindOtlpGrpc:
  54. // Always treat trace exporter as optional component, so we use nonblock here,
  55. // otherwise this would slow down app start up even set a dial timeout here when
  56. // endpoint can not reach.
  57. // If the connection not dial success, the global otel ErrorHandler will catch error
  58. // when reporting data like other exporters.
  59. return otlptracegrpc.New(
  60. context.Background(),
  61. otlptracegrpc.WithInsecure(),
  62. otlptracegrpc.WithEndpoint(c.Endpoint),
  63. )
  64. case kindOtlpHttp:
  65. // Not support flexible configuration now.
  66. return otlptracehttp.New(
  67. context.Background(),
  68. otlptracehttp.WithInsecure(),
  69. otlptracehttp.WithEndpoint(c.Endpoint),
  70. )
  71. default:
  72. return nil, fmt.Errorf("unknown exporter: %s", c.Batcher)
  73. }
  74. }
  75. func startAgent(c Config) error {
  76. opts := []sdktrace.TracerProviderOption{
  77. // Set the sampling rate based on the parent span to 100%
  78. sdktrace.WithSampler(sdktrace.ParentBased(sdktrace.TraceIDRatioBased(c.Sampler))),
  79. // Record information about this application in a Resource.
  80. sdktrace.WithResource(resource.NewSchemaless(semconv.ServiceNameKey.String(c.Name))),
  81. }
  82. if len(c.Endpoint) > 0 {
  83. exp, err := createExporter(c)
  84. if err != nil {
  85. logx.Error(err)
  86. return err
  87. }
  88. // Always be sure to batch in production.
  89. opts = append(opts, sdktrace.WithBatcher(exp))
  90. }
  91. tp = sdktrace.NewTracerProvider(opts...)
  92. otel.SetTracerProvider(tp)
  93. otel.SetErrorHandler(otel.ErrorHandlerFunc(func(err error) {
  94. logx.Errorf("[otel] error: %v", err)
  95. }))
  96. return nil
  97. }