swift-server · pokryfka · Aug 6, 2020 · Aug 6, 2020 · Aug 6, 2020 · Aug 7, 2020
diff --git a/Package.swift b/Package.swift
@@ -16,8 +16,11 @@ let package = Package(
     ],
     dependencies: [
         .package(url: "https://github.com/apple/swift-nio.git", .upToNextMajor(from: "2.17.0")),
+//        .package(url: "https://github.com/pokryfka/swift-nio.git", .branch("feature/tracing")),
         .package(url: "https://github.com/apple/swift-log.git", .upToNextMajor(from: "1.0.0")),
         .package(url: "https://github.com/swift-server/swift-backtrace.git", .upToNextMajor(from: "1.1.0")),
+        // TODO: use swift-tracing when available
+        .package(url: "https://github.com/pokryfka/aws-xray-sdk-swift.git", .upToNextMinor(from: "0.7.1")),
     ],
     targets: [
         .target(name: "AWSLambdaRuntime", dependencies: [
@@ -29,6 +32,7 @@ let package = Package(
             .product(name: "Logging", package: "swift-log"),
             .product(name: "Backtrace", package: "swift-backtrace"),
             .product(name: "NIOHTTP1", package: "swift-nio"),
+            .product(name: "AWSXRaySDK", package: "aws-xray-sdk-swift"),
         ]),
         .testTarget(name: "AWSLambdaRuntimeCoreTests", dependencies: [
             .byName(name: "AWSLambdaRuntimeCore"),
@@ -38,13 +42,15 @@ let package = Package(
         .testTarget(name: "AWSLambdaRuntimeTests", dependencies: [
             .byName(name: "AWSLambdaRuntimeCore"),
             .byName(name: "AWSLambdaRuntime"),
+            .product(name: "AWSXRayRecorder", package: "aws-xray-sdk-swift"),
         ]),
         .target(name: "AWSLambdaEvents", dependencies: []),
         .testTarget(name: "AWSLambdaEventsTests", dependencies: ["AWSLambdaEvents"]),
         // testing helper
         .target(name: "AWSLambdaTesting", dependencies: [
             .byName(name: "AWSLambdaRuntime"),
             .product(name: "NIO", package: "swift-nio"),
+            .product(name: "AWSXRayRecorder", package: "aws-xray-sdk-swift"),
         ]),
         .testTarget(name: "AWSLambdaTestingTests", dependencies: ["AWSLambdaTesting"]),
         // for perf testing

diff --git a/Sources/AWSLambdaRuntimeCore/HTTPClient.swift b/Sources/AWSLambdaRuntimeCore/HTTPClient.swift
@@ -12,6 +12,7 @@
 //
 //===----------------------------------------------------------------------===//
 
+import Baggage
 import NIO
 import NIOConcurrencyHelpers
 import NIOHTTP1
@@ -23,31 +24,35 @@ internal final class HTTPClient {
     private let eventLoop: EventLoop
     private let configuration: Lambda.Configuration.RuntimeEngine
     private let targetHost: String
+    private let tracer: TracingInstrument
 
     private var state = State.disconnected
     private var executing = false
 
-    init(eventLoop: EventLoop, configuration: Lambda.Configuration.RuntimeEngine) {
+    init(eventLoop: EventLoop, configuration: Lambda.Configuration.RuntimeEngine, tracer: TracingInstrument) {
         self.eventLoop = eventLoop
         self.configuration = configuration
         self.targetHost = "\(self.configuration.ip):\(self.configuration.port)"
+        self.tracer = tracer
     }
 
-    func get(url: String, headers: HTTPHeaders, timeout: TimeAmount? = nil) -> EventLoopFuture<Response> {
+    func get(url: String, headers: HTTPHeaders, timeout: TimeAmount? = nil, context: BaggageContext) -> EventLoopFuture<Response> {
         self.execute(Request(targetHost: self.targetHost,
                              url: url,
                              method: .GET,
                              headers: headers,
-                             timeout: timeout ?? self.configuration.requestTimeout))
+                             timeout: timeout ?? self.configuration.requestTimeout),
+                     context: context)
     }
 
-    func post(url: String, headers: HTTPHeaders, body: ByteBuffer?, timeout: TimeAmount? = nil) -> EventLoopFuture<Response> {
+    func post(url: String, headers: HTTPHeaders, body: ByteBuffer?, timeout: TimeAmount? = nil, context: BaggageContext) -> EventLoopFuture<Response> {
         self.execute(Request(targetHost: self.targetHost,
                              url: url,
                              method: .POST,
                              headers: headers,
                              body: body,
-                             timeout: timeout ?? self.configuration.requestTimeout))
+                             timeout: timeout ?? self.configuration.requestTimeout),
+                     context: context)
     }
 
     /// cancels the current request if there is one
@@ -65,7 +70,7 @@ internal final class HTTPClient {
     }
 
     // TODO: cap reconnect attempt
-    private func execute(_ request: Request, validate: Bool = true) -> EventLoopFuture<Response> {
+    private func execute(_ request: Request, validate: Bool = true, context: BaggageContext) -> EventLoopFuture<Response> {
         if validate {
             precondition(self.executing == false, "expecting single request at a time")
             self.executing = true
@@ -75,22 +80,24 @@ internal final class HTTPClient {
         case .disconnected:
             return self.connect().flatMap { channel -> EventLoopFuture<Response> in
                 self.state = .connected(channel)
-                return self.execute(request, validate: false)
+                return self.execute(request, validate: false, context: context)
             }
         case .connected(let channel):
             guard channel.isActive else {
                 self.state = .disconnected
-                return self.execute(request, validate: false)
+                return self.execute(request, validate: false, context: context)
             }
 
+            let segment = self.tracer.beginSegment(name: "HTTPClient", baggage: context)
+            segment.setHTTPRequest(method: request.method.rawValue, url: request.url)
             let promise = channel.eventLoop.makePromise(of: Response.self)
             promise.futureResult.whenComplete { _ in
                 precondition(self.executing == true, "invalid execution state")
                 self.executing = false
             }
             let wrapper = HTTPRequestWrapper(request: request, promise: promise)
             channel.writeAndFlush(wrapper).cascadeFailure(to: promise)
-            return promise.futureResult
+            return promise.futureResult.endSegment(segment)
         }
     }
 

diff --git a/Sources/AWSLambdaRuntimeCore/LambdaConfiguration.swift b/Sources/AWSLambdaRuntimeCore/LambdaConfiguration.swift
@@ -26,7 +26,8 @@ extension Lambda {
             self.init(general: .init(), lifecycle: .init(), runtimeEngine: .init())
         }
 
-        init(general: General? = nil, lifecycle: Lifecycle? = nil, runtimeEngine: RuntimeEngine? = nil) {
+        init(general: General? = nil, lifecycle: Lifecycle? = nil, runtimeEngine: RuntimeEngine? = nil)
+        {
             self.general = general ?? General()
             self.lifecycle = lifecycle ?? Lifecycle()
             self.runtimeEngine = runtimeEngine ?? RuntimeEngine()

diff --git a/Sources/AWSLambdaRuntimeCore/LambdaContext.swift b/Sources/AWSLambdaRuntimeCore/LambdaContext.swift
@@ -12,9 +12,12 @@
 //
 //===----------------------------------------------------------------------===//
 
+import AWSXRayRecorder
+import Baggage
 import Dispatch
 import Logging
 import NIO
+import NIOConcurrencyHelpers
 
 // MARK: - InitializationContext
 
@@ -50,6 +53,9 @@ extension Lambda {
     /// Lambda runtime context.
     /// The Lambda runtime generates and passes the `Context` to the Lambda handler as an argument.
     public final class Context: CustomDebugStringConvertible {
+        // TODO: switch to a read-write lock (RWLock) in a separate PR
+        private let lock = Lock()
+
         /// The request ID, which identifies the request that triggered the function invocation.
         public let requestID: String
 
@@ -68,11 +74,23 @@ extension Lambda {
         /// For invocations from the AWS Mobile SDK, data about the client application and device.
         public let clientContext: String?
 
+        // TODO: decide whether the Lambda "runtime" context and the Baggage context should be separate.
+        private var _baggage: BaggageContext
+
+        /// Baggage context for this invocation; reads and writes are serialized through `lock`.
+        public var baggage: BaggageContext {
+            get { self.lock.withLock { _baggage } }
+            set { self.lock.withLockVoid { _baggage = newValue } }
+        }
+
         /// `Logger` to log with
         ///
         /// - note: The `LogLevel` can be configured using the `LOG_LEVEL` environment variable.
         public let logger: Logger
 
+        /// Tracing instrument.
+        public let tracer: TracingInstrument
+
         /// The `EventLoop` the Lambda is executed on. Use this to schedule work with.
         /// This is useful when implementing the `EventLoopLambdaHandler` protocol.
         ///
@@ -91,8 +109,10 @@ extension Lambda {
                       cognitoIdentity: String? = nil,
                       clientContext: String? = nil,
                       logger: Logger,
+                      tracer: TracingInstrument,
                       eventLoop: EventLoop,
-                      allocator: ByteBufferAllocator) {
+                      allocator: ByteBufferAllocator)
+        {
             self.requestID = requestID
             self.traceID = traceID
             self.invokedFunctionARN = invokedFunctionARN
@@ -106,7 +126,12 @@ extension Lambda {
             var logger = logger
             logger[metadataKey: "awsRequestID"] = .string(requestID)
             logger[metadataKey: "awsTraceID"] = .string(traceID)
+            var baggage = BaggageContext()
+            // TODO: use the `swift-tracing` API; note that, regardless, only the X-Ray context can be extracted here
+            baggage.xRayContext = try? XRayContext(tracingHeader: traceID)
+            self._baggage = baggage
             self.logger = logger
+            self.tracer = tracer
         }
 
         public func getRemainingTime() -> TimeAmount {

diff --git a/Sources/AWSLambdaRuntimeCore/LambdaHandler.swift b/Sources/AWSLambdaRuntimeCore/LambdaHandler.swift
@@ -129,18 +129,31 @@ public protocol EventLoopLambdaHandler: ByteBufferLambdaHandler {
 public extension EventLoopLambdaHandler {
     /// Driver for `ByteBuffer` -> `In` decoding and `Out` -> `ByteBuffer` encoding
     func handle(context: Lambda.Context, event: ByteBuffer) -> EventLoopFuture<ByteBuffer?> {
-        switch self.decodeIn(buffer: event) {
+        let segment = context.tracer.beginSegment(name: "HandleEvent", baggage: context.baggage)
+        let decodedEvent = segment.subsegment(name: "DecodeIn") { _ in
+            self.decodeIn(buffer: event)
+        }
+        switch decodedEvent {
         case .failure(let error):
+            segment.addError(error)
+            segment.end()
             return context.eventLoop.makeFailedFuture(CodecError.requestDecoding(error))
         case .success(let `in`):
-            return self.handle(context: context, event: `in`).flatMapThrowing { out in
-                switch self.encodeOut(allocator: context.allocator, value: out) {
-                case .failure(let error):
-                    throw CodecError.responseEncoding(error)
-                case .success(let buffer):
-                    return buffer
+            let subsegment = segment.beginSubsegment(name: "HandleIn")
+            context.baggage = subsegment.baggage
+            return self.handle(context: context, event: `in`)
+                .endSegment(subsegment)
+                .flatMapThrowing { out in
+                    try context.tracer.segment(name: "EncodeOut", baggage: segment.baggage) { _ in
+                        switch self.encodeOut(allocator: context.allocator, value: out) {
+                        case .failure(let error):
+                            throw CodecError.responseEncoding(error)
+                        case .success(let buffer):
+                            return buffer
+                        }
+                    }
                 }
-            }
+                .endSegment(segment)
         }
     }
 

diff --git a/Sources/AWSLambdaRuntimeCore/LambdaLifecycle.swift b/Sources/AWSLambdaRuntimeCore/LambdaLifecycle.swift
@@ -12,6 +12,7 @@
 //
 //===----------------------------------------------------------------------===//
 
+import AWSXRaySDK
 import Logging
 import NIO
 import NIOConcurrencyHelpers
@@ -78,7 +79,9 @@ extension Lambda {
 
             var logger = self.logger
             logger[metadataKey: "lifecycleId"] = .string(self.configuration.lifecycle.id)
-            let runner = Runner(eventLoop: self.eventLoop, configuration: self.configuration)
+
+            let tracer = XRayRecorder(eventLoopGroupProvider: .shared(eventLoop))
+            let runner = Runner(eventLoop: self.eventLoop, configuration: self.configuration, tracer: tracer)
 
             let startupFuture = runner.initialize(logger: logger, factory: self.factory)
             startupFuture.flatMap { handler -> EventLoopFuture<(ByteBufferLambdaHandler, Result<Int, Error>)> in
@@ -92,6 +95,11 @@ extension Lambda {
             .flatMap { (handler, runnerResult) -> EventLoopFuture<Int> in
                 // after the lambda finishPromise has succeeded or failed we need to
                 // shutdown the handler
+                tracer.shutdown { error in
+                    if let error = error {
+                        logger.error("Failed to shutdown tracer: \(error)")
+                    }
+                }
                 let shutdownContext = ShutdownContext(logger: logger, eventLoop: self.eventLoop)
                 return handler.shutdown(context: shutdownContext).flatMapErrorThrowing { error in
                     // if, we had an error shuting down the lambda, we want to concatenate it with

diff --git a/Sources/AWSLambdaRuntimeCore/LambdaRunner.swift b/Sources/AWSLambdaRuntimeCore/LambdaRunner.swift
@@ -12,22 +12,30 @@
 //
 //===----------------------------------------------------------------------===//
 
+import AWSXRaySDK // TODO: use swift-tracing when available
+import Baggage
 import Dispatch
 import Logging
 import NIO
 
+// Temporary aliases for the type names defined in `TracingInstrument`; these aliases will be removed.
+public typealias TracingInstrument = XRayRecorder
+public typealias NoOpTracingInstrument = XRayNoOpRecorder
+
 extension Lambda {
     /// LambdaRunner manages the Lambda runtime workflow, or business logic.
     internal final class Runner {
         private let runtimeClient: RuntimeClient
+        private let tracer: TracingInstrument
         private let eventLoop: EventLoop
         private let allocator: ByteBufferAllocator
 
         private var isGettingNextInvocation = false
 
-        init(eventLoop: EventLoop, configuration: Configuration) {
+        init(eventLoop: EventLoop, configuration: Configuration, tracer: TracingInstrument) {
             self.eventLoop = eventLoop
-            self.runtimeClient = RuntimeClient(eventLoop: self.eventLoop, configuration: configuration.runtimeEngine)
+            self.runtimeClient = RuntimeClient(eventLoop: self.eventLoop, configuration: configuration.runtimeEngine, tracer: tracer)
+            self.tracer = tracer
             self.allocator = ByteBufferAllocator()
         }
 
@@ -60,15 +68,19 @@ extension Lambda {
             logger.debug("lambda invocation sequence starting")
             // 1. request invocation from lambda runtime engine
             self.isGettingNextInvocation = true
+            // capture the start time now; the trace context only becomes available with the invocation
+            let startTime = XRayRecorder.Timestamp.now()
             return self.runtimeClient.getNextInvocation(logger: logger).peekError { error in
                 logger.error("could not fetch work from lambda runtime engine: \(error)")
             }.flatMap { invocation, event in
                 // 2. send invocation to handler
                 self.isGettingNextInvocation = false
                 let context = Context(logger: logger,
+                                      tracer: self.tracer,
                                       eventLoop: self.eventLoop,
                                       allocator: self.allocator,
                                       invocation: invocation)
+                self.tracer.beginSegment(name: "getNextInvocation", baggage: context.baggage, startTime: startTime).end()
                 logger.debug("sending invocation to lambda handler \(handler)")
                 return handler.handle(context: context, event: event)
                     // Hopping back to "our" EventLoop is importnant in case the handler returns a future that
@@ -80,14 +92,19 @@ extension Lambda {
                         if case .failure(let error) = result {
                             logger.warning("lambda handler returned an error: \(error)")
                         }
-                        return (invocation, result)
+                        return (invocation, result, context)
                     }
-            }.flatMap { invocation, result in
+            }.flatMap { (invocation, result, context: Context) in
                 // 3. report results to runtime engine
-                self.runtimeClient.reportResults(logger: logger, invocation: invocation, result: result).peekError { error in
-                    logger.error("could not report results to lambda runtime engine: \(error)")
+                self.tracer.segment(name: "ReportResults", baggage: context.baggage) { segment in
+                    self.runtimeClient.reportResults(logger: logger, invocation: invocation, result: result,
+                                                     context: segment.baggage).peekError { error in
+                        logger.error("could not report results to lambda runtime engine: \(error)")
+                    }
                 }
             }
+            // flush the tracer after each invocation
+            .flush(self.tracer, recover: false)
         }
 
         /// cancels the current run, if we are waiting for next invocation (long poll from Lambda control plane)
@@ -101,14 +118,15 @@ extension Lambda {
 }
 
 private extension Lambda.Context {
-    convenience init(logger: Logger, eventLoop: EventLoop, allocator: ByteBufferAllocator, invocation: Lambda.Invocation) {
+    convenience init(logger: Logger, tracer: TracingInstrument, eventLoop: EventLoop, allocator: ByteBufferAllocator, invocation: Lambda.Invocation) {
         self.init(requestID: invocation.requestID,
                   traceID: invocation.traceID,
                   invokedFunctionARN: invocation.invokedFunctionARN,
                   deadline: DispatchWallTime(millisSinceEpoch: invocation.deadlineInMillisSinceEpoch),
                   cognitoIdentity: invocation.cognitoIdentity,
                   clientContext: invocation.clientContext,
                   logger: logger,
+                  tracer: tracer,
                   eventLoop: eventLoop,
                   allocator: allocator)
     }