agent.go 3.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120
  1. package trace
  2. import (
  3. "context"
  4. "fmt"
  5. "net/url"
  6. "sync"
  7. "github.com/zeromicro/go-zero/core/lang"
  8. "github.com/zeromicro/go-zero/core/logx"
  9. "go.opentelemetry.io/otel"
  10. "go.opentelemetry.io/otel/exporters/jaeger"
  11. "go.opentelemetry.io/otel/exporters/otlp/otlptrace/otlptracegrpc"
  12. "go.opentelemetry.io/otel/exporters/otlp/otlptrace/otlptracehttp"
  13. "go.opentelemetry.io/otel/exporters/zipkin"
  14. "go.opentelemetry.io/otel/sdk/resource"
  15. sdktrace "go.opentelemetry.io/otel/sdk/trace"
  16. semconv "go.opentelemetry.io/otel/semconv/v1.4.0"
  17. )
  // Exporter kinds recognized by createExporter when it switches on
  // Config.Batcher.
  const (
  	// kindJaeger selects the Jaeger exporter (agent or collector endpoint).
  	kindJaeger = "jaeger"
  	// kindZipkin selects the Zipkin exporter.
  	kindZipkin = "zipkin"
  	// kindOtlpGrpc selects the OTLP exporter over gRPC.
  	kindOtlpGrpc = "otlpgrpc"
  	// kindOtlpHttp selects the OTLP exporter over HTTP.
  	kindOtlpHttp = "otlphttp"
  )
  24. var (
  25. agents = make(map[string]lang.PlaceholderType)
  26. lock sync.Mutex
  27. tp *sdktrace.TracerProvider
  28. )
  29. // StartAgent starts an opentelemetry agent.
  30. func StartAgent(c Config) {
  31. lock.Lock()
  32. defer lock.Unlock()
  33. _, ok := agents[c.Endpoint]
  34. if ok {
  35. return
  36. }
  37. // if error happens, let later calls run.
  38. if err := startAgent(c); err != nil {
  39. return
  40. }
  41. agents[c.Endpoint] = lang.Placeholder
  42. }
  43. // StopAgent shuts down the span processors in the order they were registered.
  44. func StopAgent() {
  45. _ = tp.Shutdown(context.Background())
  46. }
  47. func createExporter(c Config) (sdktrace.SpanExporter, error) {
  48. // Just support jaeger and zipkin now, more for later
  49. switch c.Batcher {
  50. case kindJaeger:
  51. u, parseErr := url.Parse(c.Endpoint)
  52. if parseErr != nil {
  53. return nil, fmt.Errorf("invalid jaeger endpoint: %s", c.Endpoint)
  54. }
  55. if u.Scheme == "udp" {
  56. return jaeger.New(jaeger.WithAgentEndpoint(jaeger.WithAgentHost(u.Hostname()), jaeger.WithAgentPort(u.Port())))
  57. }
  58. return jaeger.New(jaeger.WithCollectorEndpoint(jaeger.WithEndpoint(c.Endpoint)))
  59. case kindZipkin:
  60. return zipkin.New(c.Endpoint)
  61. case kindOtlpGrpc:
  62. // Always treat trace exporter as optional component, so we use nonblock here,
  63. // otherwise this would slow down app start up even set a dial timeout here when
  64. // endpoint can not reach.
  65. // If the connection not dial success, the global otel ErrorHandler will catch error
  66. // when reporting data like other exporters.
  67. return otlptracegrpc.New(
  68. context.Background(),
  69. otlptracegrpc.WithInsecure(),
  70. otlptracegrpc.WithEndpoint(c.Endpoint),
  71. )
  72. case kindOtlpHttp:
  73. // Not support flexible configuration now.
  74. return otlptracehttp.New(
  75. context.Background(),
  76. otlptracehttp.WithInsecure(),
  77. otlptracehttp.WithEndpoint(c.Endpoint),
  78. )
  79. default:
  80. return nil, fmt.Errorf("unknown exporter: %s", c.Batcher)
  81. }
  82. }
  83. func startAgent(c Config) error {
  84. opts := []sdktrace.TracerProviderOption{
  85. // Set the sampling rate based on the parent span to 100%
  86. sdktrace.WithSampler(sdktrace.ParentBased(sdktrace.TraceIDRatioBased(c.Sampler))),
  87. // Record information about this application in a Resource.
  88. sdktrace.WithResource(resource.NewSchemaless(semconv.ServiceNameKey.String(c.Name))),
  89. }
  90. if len(c.Endpoint) > 0 {
  91. exp, err := createExporter(c)
  92. if err != nil {
  93. logx.Error(err)
  94. return err
  95. }
  96. // Always be sure to batch in production.
  97. opts = append(opts, sdktrace.WithBatcher(exp))
  98. }
  99. tp = sdktrace.NewTracerProvider(opts...)
  100. otel.SetTracerProvider(tp)
  101. otel.SetErrorHandler(otel.ErrorHandlerFunc(func(err error) {
  102. logx.Errorf("[otel] error: %v", err)
  103. }))
  104. return nil
  105. }