skywalking/agent/protocol/grpc_aio.py (148 lines of code) (raw):
#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
import logging
import traceback
from asyncio import Queue, Event
import grpc
from skywalking import config
from skywalking.agent.protocol import ProtocolAsync
from skywalking.agent.protocol.interceptors_aio import header_adder_interceptor_async
from skywalking.client.grpc_aio import GrpcServiceManagementClientAsync, GrpcTraceSegmentReportServiceAsync, \
GrpcProfileTaskChannelServiceAsync, GrpcLogReportServiceAsync, GrpcMeterReportServiceAsync
from skywalking.loggings import logger, logger_debug_enabled
from skywalking.profile.profile_task import ProfileTask
from skywalking.profile.snapshot import TracingThreadSnapshot
from skywalking.protocol.common.Common_pb2 import KeyStringValuePair
from skywalking.protocol.language_agent.Tracing_pb2 import SegmentObject, SpanObject, Log, SegmentReference
from skywalking.protocol.logging.Logging_pb2 import LogData
from skywalking.protocol.language_agent.Meter_pb2 import MeterData
from skywalking.protocol.profile.Profile_pb2 import ThreadSnapshot, ThreadStack
from skywalking.trace.segment import Segment
class GrpcProtocolAsync(ProtocolAsync):
    """
    gRPC protocol implementation for asyncio.

    Opens a single `grpc.aio` channel to `config.agent_collector_backend_services`
    and shares it between the service management, trace segment, log, meter and
    profile task clients. Every `report_*` coroutine drains the queue it is given
    through an endless async generator that is handed to the matching client.
    """

    def __init__(self):
        # Set once the instance properties have been sent successfully, see `heartbeat()`.
        self.properties_sent = Event()

        # A grpc.aio channel does not have a subscribe() method to register a callback for channel state
        # changes; it only offers wait_for_state_change()/get_state(). Since there is an inherent race between
        # invoking `wait_for_state_change` and `get_state`, and the channel state would only be used for
        # debugging, monitoring it is too costly to support. Hence no `self.state` attribute is kept here.

        interceptors = None
        if config.agent_authentication:
            interceptors = [header_adder_interceptor_async('authentication', config.agent_authentication)]

        if config.agent_force_tls:
            self.channel = grpc.aio.secure_channel(config.agent_collector_backend_services,
                                                   grpc.ssl_channel_credentials(), interceptors=interceptors)
        else:
            self.channel = grpc.aio.insecure_channel(config.agent_collector_backend_services,
                                                     interceptors=interceptors)

        self.service_management = GrpcServiceManagementClientAsync(self.channel)
        self.traces_reporter = GrpcTraceSegmentReportServiceAsync(self.channel)
        self.log_reporter = GrpcLogReportServiceAsync(self.channel)
        self.meter_reporter = GrpcMeterReportServiceAsync(self.channel)
        self.profile_channel = GrpcProfileTaskChannelServiceAsync(self.channel)

    async def query_profile_commands(self):
        """Query profile commands through the profile task channel."""
        if logger_debug_enabled:
            logger.debug('query profile commands')
        await self.profile_channel.do_query()

    async def notify_profile_task_finish(self, task: ProfileTask):
        """Report through the profile task channel that `task` has finished."""
        await self.profile_channel.finish(task)

    async def heartbeat(self):
        """
        Send a heartbeat, preceded by the instance properties if they were not sent yet.

        `properties_sent` is only set after `send_instance_props()` returns without raising,
        so a failed attempt is retried on the next heartbeat.

        Raises:
            grpc.aio.AioRpcError: re-raised after `on_error()` has been called.
        """
        try:
            if not self.properties_sent.is_set():
                await self.service_management.send_instance_props()
                self.properties_sent.set()

            await self.service_management.send_heart_beat()
        except grpc.aio.AioRpcError:
            self.on_error()
            raise

    def on_error(self):
        """
        Emit debug diagnostics for a failed gRPC call.

        Meant to be called from inside an `except` block: `traceback.print_exc()`
        prints the exception that is currently being handled.
        """
        if logger_debug_enabled:
            logger.debug('error occurred in grpc protocol (Async)')
        if logger.isEnabledFor(logging.DEBUG):
            traceback.print_exc()

    @staticmethod
    def _build_span_object(span) -> SpanObject:
        """Convert one span of a segment into its `SpanObject` protobuf message."""
        return SpanObject(
            spanId=span.sid,
            parentSpanId=span.pid,
            startTime=span.start_time,
            endTime=span.end_time,
            operationName=span.op,
            peer=span.peer,
            spanType=span.kind.name,
            spanLayer=span.layer.name,
            componentId=span.component.value,
            isError=span.error_occurred,
            logs=[Log(
                # presumably converts seconds to milliseconds -- TODO confirm the unit of `log.timestamp`
                time=int(log.timestamp * 1000),
                data=[KeyStringValuePair(key=item.key, value=item.val) for item in log.items],
            ) for log in span.logs],
            tags=[KeyStringValuePair(
                key=tag.key,
                value=tag.val,
            ) for tag in span.iter_tags()],
            # References with a falsy trace_id are left out of the message.
            refs=[SegmentReference(
                refType=0 if ref.ref_type == 'CrossProcess' else 1,
                traceId=ref.trace_id,
                parentTraceSegmentId=ref.segment_id,
                parentSpanId=ref.span_id,
                parentService=ref.service,
                parentServiceInstance=ref.service_instance,
                parentEndpoint=ref.endpoint,
                networkAddressUsedAtPeer=ref.client_address,
            ) for ref in span.refs if ref.trace_id],
        )

    @staticmethod
    def _build_segment_object(segment: Segment) -> SegmentObject:
        """Convert a `Segment` into its `SegmentObject` protobuf message."""
        return SegmentObject(
            traceId=str(segment.related_traces[0]),
            traceSegmentId=str(segment.segment_id),
            service=config.agent_name,
            serviceInstance=config.agent_instance_name,
            isSizeLimited=segment.is_size_limited,
            spans=[GrpcProtocolAsync._build_span_object(span) for span in segment.spans],
        )

    async def report_segment(self, queue: Queue):
        """
        Stream the segments taken from `queue` to the trace segment reporter.

        Args:
            queue: queue of `Segment` objects; consumed without end.

        Raises:
            grpc.aio.AioRpcError: re-raised after `on_error()` has been called.
        """
        async def generator():
            while True:
                # Let eventloop schedule blocking instead of user configuration: `config.agent_queue_timeout`
                segment = await queue.get()  # type: Segment
                # The item is marked done as soon as it is dequeued, before it is converted and yielded.
                queue.task_done()

                if logger_debug_enabled:
                    logger.debug('reporting segment %s', segment)

                yield self._build_segment_object(segment)

        try:
            await self.traces_reporter.report(generator())
        except grpc.aio.AioRpcError:
            self.on_error()
            raise  # reraise so that incremental reconnect wait can process

    async def report_log(self, queue: Queue):
        """
        Stream the log records taken from `queue` to the log reporter.

        Args:
            queue: queue of `LogData` messages; consumed without end.

        Raises:
            grpc.aio.AioRpcError: re-raised after `on_error()` has been called.
        """
        async def generator():
            while True:
                # Let eventloop schedule blocking instead of user configuration: `config.agent_queue_timeout`
                log_data = await queue.get()  # type: LogData
                # The item is marked done as soon as it is dequeued, before it is yielded.
                queue.task_done()

                if logger_debug_enabled:
                    logger.debug('Reporting Log %s', log_data.timestamp)

                yield log_data

        try:
            await self.log_reporter.report(generator())
        except grpc.aio.AioRpcError:
            self.on_error()
            raise

    async def report_meter(self, queue: Queue):
        """
        Stream the meter records taken from `queue` to the meter reporter.

        Args:
            queue: queue of `MeterData` messages; consumed without end.

        Raises:
            grpc.aio.AioRpcError: re-raised after `on_error()` has been called.
        """
        async def generator():
            while True:
                # Let eventloop schedule blocking instead of user configuration: `config.agent_queue_timeout`
                meter_data = await queue.get()  # type: MeterData
                # The item is marked done as soon as it is dequeued, before it is yielded.
                queue.task_done()

                if logger_debug_enabled:
                    logger.debug('Reporting Meter %s', meter_data.timestamp)

                yield meter_data

        try:
            await self.meter_reporter.report(generator())
        except grpc.aio.AioRpcError:
            self.on_error()
            raise

    async def report_snapshot(self, queue: Queue):
        """
        Stream the thread snapshots taken from `queue` to the profile task channel.

        Each `TracingThreadSnapshot` is converted into a `ThreadSnapshot` protobuf
        message before it is yielded.

        Args:
            queue: queue of `TracingThreadSnapshot` objects; consumed without end.

        Raises:
            grpc.aio.AioRpcError: re-raised after `on_error()` has been called.
        """
        async def generator():
            while True:
                # Let eventloop schedule blocking instead of user configuration: `config.agent_queue_timeout`
                snapshot = await queue.get()  # type: TracingThreadSnapshot
                # The item is marked done as soon as it is dequeued, before it is converted and yielded.
                queue.task_done()

                transform_snapshot = ThreadSnapshot(
                    taskId=str(snapshot.task_id),
                    traceSegmentId=str(snapshot.trace_segment_id),
                    time=int(snapshot.time),
                    sequence=int(snapshot.sequence),
                    stack=ThreadStack(codeSignatures=snapshot.stack_list)
                )

                yield transform_snapshot

        try:
            await self.profile_channel.report(generator())
        except grpc.aio.AioRpcError:
            self.on_error()
            raise