pw_log/log.proto - pigweed/pigweed - Git at Google

 // Copyright 2021 The Pigweed Authors
 //
 // Licensed under the Apache License, Version 2.0 (the "License"); you may not
 // use this file except in compliance with the License. You may obtain a copy of
 // the License at
 //
 //     https://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
 // WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
 // License for the specific language governing permissions and limitations under
 // the License.

 syntax = "proto3";

 package pw.log;

 import "pw_tokenizer/proto/options.proto";

 option java_outer_classname = "Log";

 // A log message and metadata. Logs come in a few different forms:
 //
 //  1. A tokenized log message (recommended for production)
 //  2. A non-tokenized log message (good for development)
 //  3. A "log missed" tombstone, indicating that some logs were dropped
 //
 // Size analysis for tokenized log messages, including each field's proto tag:
 //
 //  - message     - 6-12 bytes, depending on number and value of arguments
 //  - line_level  - 3 bytes; 4 bytes if line > 2048 (uncommon)
 //  - timestamp   - 3 bytes; assuming delta encoding
 //  - thread_name - 6 bytes
 //
 // Adding the fields gives the total proto message size:
 //
 //    6-12 bytes - log
 //    9-15 bytes - log + level + line
 //   12-18 bytes - log + level + line + timestamp
 //
 // An analysis of a project's log token database revealed the following
 // distribution of the number of arguments to log messages:
 //
 //   # args   # messages
 //     0         2,700
 //     1         2,400
 //     2         1,200
 //     3+        1,000
 //
 // Note: The below proto makes some compromises compared to what one might
 // expect for a "clean" proto design, in order to shave bytes off of the
 // messages. It is critical that the log messages are as small as possible to
 // enable storing more logs in limited memory. This is why, for example, there
 // is no separate "DroppedLog" type, or a "TokenizedLog" and "StringLog", which
 // would add at least 2 extra bytes per message
 message LogEntry {
   // The log message, which may be tokenized.
   //
   // If tokenized logging is used, implementations may encode metadata in the
   // log message rather than as separate proto fields. This reduces the size of
   // the protobuf with no overhead.
   //
   // The standard format for encoding metadata in the log message is defined by
   // the pw_log_tokenized module. The message and metadata are encoded as
   // key-value pairs using ■ and ♦ as delimiters. For example:
   //
   //  ■msg♦This is the log message: %d■module♦wifi■file♦../path/to/file.cc
   //
   // See http://pigweed.dev/pw_log_tokenized for full details. When
   // pw_log_tokenized is used, this metadata is automatically included as
   // described.
   //
   // The level and flags are not included since they may be runtime values and
   // thus cannot always be tokenized. The line number is not included because
   // line numbers change frequently and a new token is created for each line.
   //
   // Size analysis when tokenized:
   //
   //   tag+wire = 1 byte
   //   size     = 1 byte; payload will almost always be < 127 bytes
   //   payload  = N bytes; typically 4-10 in practice
   //
   // Total: 2 + N ~= 6-12 bytes
   optional bytes message = 1 [(tokenizer.format) = TOKENIZATION_OPTIONAL];

   // Packed log level and line number. Structure:
   //
   //   Level: Bottom 3 bits; level = line_level & 0x7
   //   Line: Remaining bits; line = (line_level >> 3)
   //
   // Note: This packing saves two bytes per log message in most cases compared
   // to having line and level separately; and is zero-cost if the log backend
   // omits the line number.
   optional uint32 line_level = 2;

   // Some log messages have flags to indicate attributes such as whether they
   // are from an assert or if they contain PII. The particular flags are
   // product- and implementation-dependent.
   optional uint32 flags = 3;

   // Timestamps are either specified with an absolute timestamp or relative to
   // the previous log entry.
   oneof time {
     // The absolute timestamp in implementation-defined ticks. Applications
     // determine how to interpret this on the receiving end. In the simplest
     // case, these ticks might be milliseconds or microseconds since boot.
     // Applications could also access clock information out-of-band with a
     // ClockParameters protobuf.
     int64 timestamp = 4;

     // Time since the last entry in implementation-defined ticks, as for the
     // timestamp field. This enables delta encoding when batching entries
     // together.
     //
     // Size analysis for this field including tag and varint, assuming 1 kHz
     // ticks:
     //
     //           < 127 ms gap == 127 ms      ==  7 bits == 2 bytes
     //        < 16,000 ms gap ==  16 seconds == 14 bits == 3 bytes
     //     < 2,000,000 ms gap ==  35 minutes == 21 bits == 4 bytes
     //   < 300,000,000 ms gap ==  74 hours   == 28 bits == 5 bytes
     //
     // Log bursts will thus consume just 2 bytes (tag + up to 127ms delta) for
     // the timestamp, which is a good improvement over an absolute timestamp.
     int64 time_since_last_entry = 5;
   }

   // The following fields are planned but will not be added until they are
   // needed. Protobuf field numbers over 15 use an extra byte, so these fields
   // are left out for now to avoid reserving field numbers unnecessarily.

   // When the log buffers are full but more logs come in, the logs are counted
   // and a special log message is omitted with only counts for the number of
   // messages dropped. The timestamp indicates the time that the "missed logs"
   // message was inserted into the queue.
   //
   // As an alternative to these fields, implementations may simply send a
   // message stating the drop count.
   // optional uint32 dropped = ?;
   // optional uint32 dropped_warning_or_above = ?;

   // Represents the device from which the log originated. The meaning of this
   // field is implementation defined
   // optional uint32 source_id = ?;

   // The task or thread name that created the log message. If the log was not
   // created on a thread, it should use a name appropriate to that context.
   // optional bytes thread_name = ?
   //     [(tokenizer.format) = TOKENIZATION_OPTIONAL];

   // The file path where this log was created, if not encoded in the message.
   // optional bytes file = ? [(tokenizer.format) = TOKENIZATION_OPTIONAL];

   // The PW_LOG_MODULE_NAME for this log message, if it is not encoded in the
   // message.
   // optional bytes module_name = ?
   //    [(tokenizer.format) = TOKENIZATION_OPTIONAL];

   // Some messages are associated with trace events, which may carry additional
   // contextual data. This is a tuple of a data format string which could be
   // used by the decoder to identify the data (e.g. printf-style tokens) and the
   // data itself in bytes.
   // optional bytes data_format = ?
   //     [(tokenizer.format) = TOKENIZATION_OPTIONAL];
   // optional bytes data = ?;
 }

 message LogRequest {
   // This will include fields for configuring log filtering.
 }

 message LogEntries {
   repeated LogEntry entries = 1;
 }

 // RPC service for accessing logs.
 service Logs {
   rpc Listen(LogRequest) returns (stream LogEntries);
 }
	// Copyright 2021 The Pigweed Authors
	//
	// Licensed under the Apache License, Version 2.0 (the "License"); you may not
	// use this file except in compliance with the License. You may obtain a copy of
	// the License at
	//
	// https://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
	// WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
	// License for the specific language governing permissions and limitations under
	// the License.

	syntax = "proto3";

	package pw.log;

	import "pw_tokenizer/proto/options.proto";

	option java_outer_classname = "Log";

	// A log message and metadata. Logs come in a few different forms:
	//
	// 1. A tokenized log message (recommended for production)
	// 2. A non-tokenized log message (good for development)
	// 3. A "log missed" tombstone, indicating that some logs were dropped
	//
	// Size analysis for tokenized log messages, including each field's proto tag:
	//
	// - message - 6-12 bytes, depending on number and value of arguments
	// - line_level - 3 bytes; 4 bytes if line > 2048 (uncommon)
	// - timestamp - 3 bytes; assuming delta encoding
	// - thread_name - 6 bytes
	//
	// Adding the fields gives the total proto message size:
	//
	// 6-12 bytes - log
	// 9-15 bytes - log + level + line
	// 12-18 bytes - log + level + line + timestamp
	//
	// An analysis of a project's log token database revealed the following
	// distribution of the number of arguments to log messages:
	//
	// # args # messages
	// 0 2,700
	// 1 2,400
	// 2 1,200
	// 3+ 1,000
	//
	// Note: The below proto makes some compromises compared to what one might
	// expect for a "clean" proto design, in order to shave bytes off of the
	// messages. It is critical that the log messages are as small as possible to
	// enable storing more logs in limited memory. This is why, for example, there
	// is no separate "DroppedLog" type, or a "TokenizedLog" and "StringLog", which
	// would add at least 2 extra bytes per message
	message LogEntry {
	// The log message, which may be tokenized.
	//
	// If tokenized logging is used, implementations may encode metadata in the
	// log message rather than as separate proto fields. This reduces the size of
	// the protobuf with no overhead.
	//
	// The standard format for encoding metadata in the log message is defined by
	// the pw_log_tokenized module. The message and metadata are encoded as
	// key-value pairs using ■ and ♦ as delimiters. For example:
	//
	// ■msg♦This is the log message: %d■module♦wifi■file♦../path/to/file.cc
	//
	// See http://pigweed.dev/pw_log_tokenized for full details. When
	// pw_log_tokenized is used, this metadata is automatically included as
	// described.
	//
	// The level and flags are not included since they may be runtime values and
	// thus cannot always be tokenized. The line number is not included because
	// line numbers change frequently and a new token is created for each line.
	//
	// Size analysis when tokenized:
	//
	// tag+wire = 1 byte
	// size = 1 byte; payload will almost always be < 127 bytes
	// payload = N bytes; typically 4-10 in practice
	//
	// Total: 2 + N ~= 6-12 bytes
	optional bytes message = 1 [(tokenizer.format) = TOKENIZATION_OPTIONAL];

	// Packed log level and line number. Structure:
	//
	// Level: Bottom 3 bits; level = line_level & 0x7
	// Line: Remaining bits; line = (line_level >> 3)
	//
	// Note: This packing saves two bytes per log message in most cases compared
	// to having line and level separately; and is zero-cost if the log backend
	// omits the line number.
	optional uint32 line_level = 2;

	// Some log messages have flags to indicate attributes such as whether they
	// are from an assert or if they contain PII. The particular flags are
	// product- and implementation-dependent.
	optional uint32 flags = 3;

	// Timestamps are either specified with an absolute timestamp or relative to
	// the previous log entry.
	oneof time {
	// The absolute timestamp in implementation-defined ticks. Applications
	// determine how to interpret this on the receiving end. In the simplest
	// case, these ticks might be milliseconds or microseconds since boot.
	// Applications could also access clock information out-of-band with a
	// ClockParameters protobuf.
	int64 timestamp = 4;

	// Time since the last entry in implementation-defined ticks, as for the
	// timestamp field. This enables delta encoding when batching entries
	// together.
	//
	// Size analysis for this field including tag and varint, assuming 1 kHz
	// ticks:
	//
	// < 127 ms gap == 127 ms == 7 bits == 2 bytes
	// < 16,000 ms gap == 16 seconds == 14 bits == 3 bytes
	// < 2,000,000 ms gap == 35 minutes == 21 bits == 4 bytes
	// < 300,000,000 ms gap == 74 hours == 28 bits == 5 bytes
	//
	// Log bursts will thus consume just 2 bytes (tag + up to 127ms delta) for
	// the timestamp, which is a good improvement over an absolute timestamp.
	int64 time_since_last_entry = 5;
	}

	// The following fields are planned but will not be added until they are
	// needed. Protobuf field numbers over 15 use an extra byte, so these fields
	// are left out for now to avoid reserving field numbers unnecessarily.

	// When the log buffers are full but more logs come in, the logs are counted
	// and a special log message is omitted with only counts for the number of
	// messages dropped. The timestamp indicates the time that the "missed logs"
	// message was inserted into the queue.
	//
	// As an alternative to these fields, implementations may simply send a
	// message stating the drop count.
	// optional uint32 dropped = ?;
	// optional uint32 dropped_warning_or_above = ?;

	// Represents the device from which the log originated. The meaning of this
	// field is implementation defined
	// optional uint32 source_id = ?;

	// The task or thread name that created the log message. If the log was not
	// created on a thread, it should use a name appropriate to that context.
	// optional bytes thread_name = ?
	// [(tokenizer.format) = TOKENIZATION_OPTIONAL];

	// The file path where this log was created, if not encoded in the message.
	// optional bytes file = ? [(tokenizer.format) = TOKENIZATION_OPTIONAL];

	// The PW_LOG_MODULE_NAME for this log message, if it is not encoded in the
	// message.
	// optional bytes module_name = ?
	// [(tokenizer.format) = TOKENIZATION_OPTIONAL];

	// Some messages are associated with trace events, which may carry additional
	// contextual data. This is a tuple of a data format string which could be
	// used by the decoder to identify the data (e.g. printf-style tokens) and the
	// data itself in bytes.
	// optional bytes data_format = ?
	// [(tokenizer.format) = TOKENIZATION_OPTIONAL];
	// optional bytes data = ?;
	}

	message LogRequest {
	// This will include fields for configuring log filtering.
	}

	message LogEntries {
	repeated LogEntry entries = 1;
	}

	// RPC service for accessing logs.
	service Logs {
	rpc Listen(LogRequest) returns (stream LogEntries);
	}