src/google/protobuf/compiler/cpp/helpers.h - third_party/github/protocolbuffers/protobuf - Git at Google

 // Protocol Buffers - Google's data interchange format
 // Copyright 2008 Google Inc.  All rights reserved.
 //
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file or at
 // https://developers.google.com/open-source/licenses/bsd

 // Author: kenton@google.com (Kenton Varda)
 //  Based on original Protocol Buffers design by
 //  Sanjay Ghemawat, Jeff Dean, and others.

 #ifndef GOOGLE_PROTOBUF_COMPILER_CPP_HELPERS_H__
 #define GOOGLE_PROTOBUF_COMPILER_CPP_HELPERS_H__

 #include <iterator>
 #include <string>
 #include <tuple>
 #include <vector>

 #include "absl/container/flat_hash_map.h"
 #include "absl/log/absl_check.h"
 #include "absl/strings/str_cat.h"
 #include "absl/strings/str_split.h"
 #include "absl/strings/string_view.h"
 #include "absl/types/optional.h"
 #include "google/protobuf/compiler/code_generator.h"
 #include "google/protobuf/compiler/cpp/names.h"
 #include "google/protobuf/compiler/cpp/options.h"
 #include "google/protobuf/compiler/scc.h"
 #include "google/protobuf/descriptor.h"
 #include "google/protobuf/descriptor.pb.h"
 #include "google/protobuf/io/printer.h"
 #include "google/protobuf/port.h"


 // Must be included last.
 #include "google/protobuf/port_def.inc"

 namespace google {
 namespace protobuf {
 namespace compiler {
 namespace cpp {
 enum class ArenaDtorNeeds { kNone = 0, kOnDemand = 1, kRequired = 2 };

 inline absl::string_view ProtobufNamespace(const Options& opts) {
   // This won't be transformed by copybara, since copybara looks for google::protobuf::.
   constexpr absl::string_view kGoogle3Ns = "proto2";
   constexpr absl::string_view kOssNs = "google::protobuf";

   return opts.opensource_runtime ? kOssNs : kGoogle3Ns;
 }

 inline std::string MacroPrefix(const Options& options) {
   // Constants are different in the internal and external version.
   return options.opensource_runtime ? "GOOGLE_PROTOBUF" : "GOOGLE_PROTOBUF";
 }

 inline std::string DeprecatedAttribute(const Options&,
                                        const FieldDescriptor* d) {
   return d->options().deprecated() ? "[[deprecated]] " : "";
 }

 inline std::string DeprecatedAttribute(const Options&,
                                        const EnumValueDescriptor* d) {
   return d->options().deprecated() ? "[[deprecated]] " : "";
 }

 // Commonly-used separator comments.  Thick is a line of '=', thin is a line
 // of '-'.
 extern const char kThickSeparator[];
 extern const char kThinSeparator[];

 absl::flat_hash_map<absl::string_view, std::string> MessageVars(
     const Descriptor* desc);

 // Variables to access message data from the message scope.
 void SetCommonMessageDataVariables(
     const Descriptor* descriptor,
     absl::flat_hash_map<absl::string_view, std::string>* variables);

 absl::flat_hash_map<absl::string_view, std::string> UnknownFieldsVars(
     const Descriptor* desc, const Options& opts);

 void SetUnknownFieldsVariable(
     const Descriptor* descriptor, const Options& options,
     absl::flat_hash_map<absl::string_view, std::string>* variables);

 bool GetBootstrapBasename(const Options& options, absl::string_view basename,
                           std::string* bootstrap_basename);
 bool MaybeBootstrap(const Options& options, GeneratorContext* generator_context,
                     bool bootstrap_flag, std::string* basename);
 bool IsBootstrapProto(const Options& options, const FileDescriptor* file);

 // Name space of the proto file. This namespace is such that the string
 // "<namespace>::some_name" is the correct fully qualified namespace.
 // This means if the package is empty the namespace is "", and otherwise
 // the namespace is "::foo::bar::...::baz" without trailing semi-colons.
 std::string Namespace(const FileDescriptor* d, const Options& options);
 std::string Namespace(const Descriptor* d, const Options& options);
 std::string Namespace(const FieldDescriptor* d, const Options& options);
 std::string Namespace(const EnumDescriptor* d, const Options& options);
 PROTOC_EXPORT std::string Namespace(const FileDescriptor* d);
 PROTOC_EXPORT std::string Namespace(const Descriptor* d);
 PROTOC_EXPORT std::string Namespace(const FieldDescriptor* d);
 PROTOC_EXPORT std::string Namespace(const EnumDescriptor* d);

 class MessageSCCAnalyzer;

 // Returns true if it's safe to init "field" to zero.
 bool CanInitializeByZeroing(const FieldDescriptor* field,
                             const Options& options,
                             MessageSCCAnalyzer* scc_analyzer);
 // Returns true if it's safe to reset "field" to zero.
 bool CanClearByZeroing(const FieldDescriptor* field);
 // Determines if swap can be implemented via memcpy.
 bool HasTrivialSwap(const FieldDescriptor* field, const Options& options,
                     MessageSCCAnalyzer* scc_analyzer);

 PROTOC_EXPORT std::string ClassName(const Descriptor* descriptor);
 PROTOC_EXPORT std::string ClassName(const EnumDescriptor* enum_descriptor);

 std::string QualifiedClassName(const Descriptor* d, const Options& options);
 std::string QualifiedClassName(const EnumDescriptor* d, const Options& options);

 PROTOC_EXPORT std::string QualifiedClassName(const Descriptor* d);
 PROTOC_EXPORT std::string QualifiedClassName(const EnumDescriptor* d);

 // DEPRECATED just use ClassName or QualifiedClassName, a boolean is very
 // unreadable at the callsite.
 // Returns the non-nested type name for the given type.  If "qualified" is
 // true, prefix the type with the full namespace.  For example, if you had:
 //   package foo.bar;
 //   message Baz { message Moo {} }
 // Then the qualified ClassName for Moo would be:
 //   ::foo::bar::Baz_Moo
 // While the non-qualified version would be:
 //   Baz_Moo
 inline std::string ClassName(const Descriptor* descriptor, bool qualified) {
   return qualified ? QualifiedClassName(descriptor, Options())
                    : ClassName(descriptor);
 }

 inline std::string ClassName(const EnumDescriptor* descriptor, bool qualified) {
   return qualified ? QualifiedClassName(descriptor, Options())
                    : ClassName(descriptor);
 }

 // Returns the extension name prefixed with the class name if nested but without
 // the package name.
 std::string ExtensionName(const FieldDescriptor* d);

 std::string QualifiedExtensionName(const FieldDescriptor* d,
                                    const Options& options);
 std::string QualifiedExtensionName(const FieldDescriptor* d);

 // Type name of default instance.
 std::string DefaultInstanceType(const Descriptor* descriptor,
                                 const Options& options, bool split = false);

 // Non-qualified name of the default_instance of this message.
 std::string DefaultInstanceName(const Descriptor* descriptor,
                                 const Options& options, bool split = false);

 // Non-qualified name of the default instance pointer. This is used only for
 // implicit weak fields, where we need an extra indirection.
 std::string DefaultInstancePtr(const Descriptor* descriptor,
                                const Options& options, bool split = false);

 // Fully qualified name of the default_instance of this message.
 std::string QualifiedDefaultInstanceName(const Descriptor* descriptor,
                                          const Options& options,
                                          bool split = false);

 // Fully qualified name of the default instance pointer.
 std::string QualifiedDefaultInstancePtr(const Descriptor* descriptor,
                                         const Options& options,
                                         bool split = false);

 // DescriptorTable variable name.
 std::string DescriptorTableName(const FileDescriptor* file,
                                 const Options& options);

 // When declaring symbol externs from another file, this macro will supply the
 // dllexport needed for the target file, if any.
 std::string FileDllExport(const FileDescriptor* file, const Options& options);

 // Name of the base class: google::protobuf::Message or google::protobuf::MessageLite.
 std::string SuperClassName(const Descriptor* descriptor,
                            const Options& options);

 // Adds an underscore if necessary to prevent conflicting with a keyword.
 std::string ResolveKeyword(absl::string_view name);

 // Get the (unqualified) name that should be used for this field in C++ code.
 // The name is coerced to lower-case to emulate proto1 behavior.  People
 // should be using lowercase-with-underscores style for proto field names
 // anyway, so normally this just returns field->name().
 PROTOC_EXPORT std::string FieldName(const FieldDescriptor* field);

 // Returns the (unqualified) private member name for this field in C++ code.
 std::string FieldMemberName(const FieldDescriptor* field, bool split);

 // Returns an estimate of the compiler's alignment for the field.  This
 // can't guarantee to be correct because the generated code could be compiled on
 // different systems with different alignment rules.  The estimates below assume
 // 64-bit pointers.
 int EstimateAlignmentSize(const FieldDescriptor* field);

 // Returns an estimate of the size of the field.  This
 // can't guarantee to be correct because the generated code could be compiled on
 // different systems with different alignment rules.  The estimates below assume
 // 64-bit pointers.
 int EstimateSize(const FieldDescriptor* field);

 // Get the unqualified name that should be used for a field's field
 // number constant.
 std::string FieldConstantName(const FieldDescriptor* field);

 // Returns the scope where the field was defined (for extensions, this is
 // different from the message type to which the field applies).
 inline const Descriptor* FieldScope(const FieldDescriptor* field) {
   return field->is_extension() ? field->extension_scope()
                                : field->containing_type();
 }

 // Returns the fully-qualified type name field->message_type().  Usually this
 // is just ClassName(field->message_type(), true);
 std::string FieldMessageTypeName(const FieldDescriptor* field,
                                  const Options& options);

 // Get the C++ type name for a primitive type (e.g. "double", "::int32", etc.).
 const char* PrimitiveTypeName(FieldDescriptor::CppType type);
 std::string PrimitiveTypeName(const Options& options,
                               FieldDescriptor::CppType type);

 // Get the declared type name in CamelCase format, as is used e.g. for the
 // methods of WireFormat.  For example, TYPE_INT32 becomes "Int32".
 const char* DeclaredTypeMethodName(FieldDescriptor::Type type);

 // Return the code that evaluates to the number when compiled.
 std::string Int32ToString(int number);

 // Get code that evaluates to the field's default value.
 std::string DefaultValue(const Options& options, const FieldDescriptor* field);

 // Compatibility function for callers outside proto2.
 std::string DefaultValue(const FieldDescriptor* field);

 // Convert a file name into a valid identifier.
 std::string FilenameIdentifier(absl::string_view filename);

 // For each .proto file generates a unique name. To prevent collisions of
 // symbols in the global namespace
 std::string UniqueName(absl::string_view name, absl::string_view filename,
                        const Options& options);
 inline std::string UniqueName(absl::string_view name, const FileDescriptor* d,
                               const Options& options) {
   return UniqueName(name, d->name(), options);
 }
 inline std::string UniqueName(absl::string_view name, const Descriptor* d,
                               const Options& options) {
   return UniqueName(name, d->file(), options);
 }
 inline std::string UniqueName(absl::string_view name, const EnumDescriptor* d,
                               const Options& options) {
   return UniqueName(name, d->file(), options);
 }
 inline std::string UniqueName(absl::string_view name,
                               const ServiceDescriptor* d,
                               const Options& options) {
   return UniqueName(name, d->file(), options);
 }

 // Versions for call sites that only support the internal runtime (like proto1
 // support).
 inline Options InternalRuntimeOptions() {
   Options options;
   options.opensource_runtime = false;
   return options;
 }
 inline std::string UniqueName(absl::string_view name,
                               absl::string_view filename) {
   return UniqueName(name, filename, InternalRuntimeOptions());
 }
 inline std::string UniqueName(absl::string_view name, const FileDescriptor* d) {
   return UniqueName(name, d->name(), InternalRuntimeOptions());
 }
 inline std::string UniqueName(absl::string_view name, const Descriptor* d) {
   return UniqueName(name, d->file(), InternalRuntimeOptions());
 }
 inline std::string UniqueName(absl::string_view name, const EnumDescriptor* d) {
   return UniqueName(name, d->file(), InternalRuntimeOptions());
 }
 inline std::string UniqueName(absl::string_view name,
                               const ServiceDescriptor* d) {
   return UniqueName(name, d->file(), InternalRuntimeOptions());
 }

 // Return the qualified C++ name for a file level symbol.
 std::string QualifiedFileLevelSymbol(const FileDescriptor* file,
                                      absl::string_view name,
                                      const Options& options);

 // Escape C++ trigraphs by escaping question marks to \?
 std::string EscapeTrigraphs(absl::string_view to_escape);

 // Escaped function name to eliminate naming conflict.
 std::string SafeFunctionName(const Descriptor* descriptor,
                              const FieldDescriptor* field,
                              absl::string_view prefix);

 // Returns the optimize mode for <file>, respecting <options.enforce_lite>.
 FileOptions_OptimizeMode GetOptimizeFor(const FileDescriptor* file,
                                         const Options& options);

 // Determines whether unknown fields will be stored in an UnknownFieldSet or
 // a string.
 inline bool UseUnknownFieldSet(const FileDescriptor* file,
                                const Options& options) {
   return GetOptimizeFor(file, options) != FileOptions::LITE_RUNTIME;
 }

 inline bool IsWeak(const FieldDescriptor* field, const Options& options) {
   if (field->options().weak()) {
     ABSL_CHECK(!options.opensource_runtime);
     return true;
   }
   return false;
 }

 inline bool IsCord(const FieldDescriptor* field) {
   return field->cpp_type() == FieldDescriptor::CPPTYPE_STRING &&
          internal::cpp::EffectiveStringCType(field) == FieldOptions::CORD;
 }

 inline bool IsString(const FieldDescriptor* field) {
   return field->cpp_type() == FieldDescriptor::CPPTYPE_STRING &&
          internal::cpp::EffectiveStringCType(field) == FieldOptions::STRING;
 }

 inline bool IsStringPiece(const FieldDescriptor* field) {
   return field->cpp_type() == FieldDescriptor::CPPTYPE_STRING &&
          internal::cpp::EffectiveStringCType(field) ==
              FieldOptions::STRING_PIECE;
 }

 bool IsProfileDriven(const Options& options);

 // Returns true if `field` is unlikely to be present based on PDProto profile.
 bool IsRarelyPresent(const FieldDescriptor* field, const Options& options);

 // Returns true if `field` is likely to be present based on PDProto profile.
 bool IsLikelyPresent(const FieldDescriptor* field, const Options& options);

 float GetPresenceProbability(const FieldDescriptor* field,
                              const Options& options);

 bool IsStringInliningEnabled(const Options& options);

 // Returns true if the provided field is a singular string and can be inlined.
 bool CanStringBeInlined(const FieldDescriptor* field);

 // Returns true if `field` is a string field that can and should be inlined
 // based on PDProto profile.
 bool IsStringInlined(const FieldDescriptor* field, const Options& options);

 // Returns true if `field` should be inlined based on PDProto profile.
 // Currently we only enable inlining for string fields backed by a std::string
 // instance, but in the future we may expand this to message types.
 inline bool IsFieldInlined(const FieldDescriptor* field,
                            const Options& options) {
   return IsStringInlined(field, options);
 }

 // Does the given FileDescriptor use lazy fields?
 bool HasLazyFields(const FileDescriptor* file, const Options& options,
                    MessageSCCAnalyzer* scc_analyzer);

 // Is the given field a supported lazy field?
 bool IsLazy(const FieldDescriptor* field, const Options& options,
             MessageSCCAnalyzer* scc_analyzer);

 // Is this an explicit (non-profile driven) lazy field, as denoted by
 // lazy/unverified_lazy in the descriptor?
 inline bool IsExplicitLazy(const FieldDescriptor* field) {
   if (field->is_map() || field->is_repeated()) {
     return false;
   }

   if (field->cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE) {
     return false;
   }

   return field->options().lazy() || field->options().unverified_lazy();
 }

 bool IsEagerlyVerifiedLazy(const FieldDescriptor* field, const Options& options,
                            MessageSCCAnalyzer* scc_analyzer);

 bool IsLazilyVerifiedLazy(const FieldDescriptor* field, const Options& options);

 bool ShouldVerify(const Descriptor* descriptor, const Options& options,
                   MessageSCCAnalyzer* scc_analyzer);
 bool ShouldVerify(const FileDescriptor* file, const Options& options,
                   MessageSCCAnalyzer* scc_analyzer);
 bool ShouldVerifyRecursively(const FieldDescriptor* field);

 // Indicates whether to use predefined verify methods for a given message. If a
 // message is "simple" and needs no special verification per field (e.g. message
 // field, repeated packed, UTF8 string, etc.), we can use either VerifySimple or
 // VerifySimpleAlwaysCheckInt32 methods as all verification can be done based on
 // the wire type.
 //
 // Otherwise, we need "custom" verify methods tailored to a message to pass
 // which field needs a special verification; i.e. InternalVerify.
 enum class VerifySimpleType {
   kSimpleInt32Never,   // Use VerifySimple
   kSimpleInt32Always,  // Use VerifySimpleAlwaysCheckInt32
   kCustom,             // Use InternalVerify and check only for int32
   kCustomInt32Never,   // Use InternalVerify but never check for int32
   kCustomInt32Always,  // Use InternalVerify and always check for int32
 };

 // Returns VerifySimpleType if messages can be verified by predefined methods.
 VerifySimpleType ShouldVerifySimple(const Descriptor* descriptor);


 // Is the given message being split (go/pdsplit)?
 bool ShouldSplit(const Descriptor* desc, const Options& options);

 // Is the given field being split out?
 bool ShouldSplit(const FieldDescriptor* field, const Options& options);

 // Should we generate code that force creating an allocation in the constructor
 // of the given message?
 bool ShouldForceAllocationOnConstruction(const Descriptor* desc,
                                          const Options& options);

 // Returns true if the message is present based on PDProto profile.
 bool IsPresentMessage(const Descriptor* descriptor, const Options& options);

 // Returns the most likely present field. Returns nullptr if not profile driven.
 const FieldDescriptor* FindHottestField(
     const std::vector<const FieldDescriptor*>& fields, const Options& options);

 // Does the file contain any definitions that need extension_set.h?
 bool HasExtensionsOrExtendableMessage(const FileDescriptor* file);

 // Does the file have any repeated fields, necessitating the file to include
 // repeated_field.h? This does not include repeated extensions, since those are
 // all stored internally in an ExtensionSet, not a separate RepeatedField*.
 bool HasRepeatedFields(const FileDescriptor* file);

 // Does the file have any string/bytes fields with ctype=STRING_PIECE? This
 // does not include extensions, since ctype is ignored for extensions.
 bool HasStringPieceFields(const FileDescriptor* file, const Options& options);

 // Does the file have any string/bytes fields with ctype=CORD? This does not
 // include extensions, since ctype is ignored for extensions.
 bool HasCordFields(const FileDescriptor* file, const Options& options);

 // Does the file have any map fields, necessitating the file to include
 // map_field_inl.h and map.h.
 bool HasMapFields(const FileDescriptor* file);

 // Does this file have any enum type definitions?
 bool HasEnumDefinitions(const FileDescriptor* file);

 // Does this file have generated parsing, serialization, and other
 // standard methods for which reflection-based fallback implementations exist?
 inline bool HasGeneratedMethods(const FileDescriptor* file,
                                 const Options& options) {
   return GetOptimizeFor(file, options) != FileOptions::CODE_SIZE;
 }

 // Do message classes in this file have descriptor and reflection methods?
 inline bool HasDescriptorMethods(const FileDescriptor* file,
                                  const Options& options) {
   return GetOptimizeFor(file, options) != FileOptions::LITE_RUNTIME;
 }

 // Should we generate generic services for this file?
 inline bool HasGenericServices(const FileDescriptor* file,
                                const Options& options) {
   return file->service_count() > 0 &&
          GetOptimizeFor(file, options) != FileOptions::LITE_RUNTIME &&
          file->options().cc_generic_services();
 }

 inline bool IsProto2MessageSet(const Descriptor* descriptor,
                                const Options& options) {
   return !options.opensource_runtime &&
          options.enforce_mode != EnforceOptimizeMode::kLiteRuntime &&
          !options.lite_implicit_weak_fields &&
          descriptor->options().message_set_wire_format() &&
          descriptor->full_name() == "google.protobuf.bridge.MessageSet";
 }

 inline bool IsMapEntryMessage(const Descriptor* descriptor) {
   return descriptor->options().map_entry();
 }

 // Returns true if the field's CPPTYPE is string or message.
 bool IsStringOrMessage(const FieldDescriptor* field);

 std::string UnderscoresToCamelCase(absl::string_view input,
                                    bool cap_next_letter);

 inline bool IsCrossFileMessage(const FieldDescriptor* field) {
   return field->type() == FieldDescriptor::TYPE_MESSAGE &&
          field->message_type()->file() != field->file();
 }

 inline std::string MakeDefaultName(const FieldDescriptor* field) {
   return absl::StrCat("_i_give_permission_to_break_this_code_default_",
                       FieldName(field), "_");
 }

 // Semantically distinct from MakeDefaultName in that it gives the C++ code
 // referencing a default field from the message scope, rather than just the
 // variable name.
 // For example, declarations of default variables should always use just
 // MakeDefaultName to produce code like:
 //   Type _i_give_permission_to_break_this_code_default_field_;
 //
 // Code that references these should use MakeDefaultFieldName, in case the field
 // exists at some nested level like:
 //   internal_container_._i_give_permission_to_break_this_code_default_field_;
 inline std::string MakeDefaultFieldName(const FieldDescriptor* field) {
   return absl::StrCat("Impl_::", MakeDefaultName(field));
 }

 inline std::string MakeVarintCachedSizeName(const FieldDescriptor* field) {
   return absl::StrCat("_", FieldName(field), "_cached_byte_size_");
 }

 // Semantically distinct from MakeVarintCachedSizeName in that it gives the C++
 // code referencing the object from the message scope, rather than just the
 // variable name.
 // For example, declarations of default variables should always use just
 // MakeVarintCachedSizeName to produce code like:
 //   Type _field_cached_byte_size_;
 //
 // Code that references these variables should use
 // MakeVarintCachedSizeFieldName, in case the field exists at some nested level
 // like:
 //   internal_container_._field_cached_byte_size_;
 inline std::string MakeVarintCachedSizeFieldName(const FieldDescriptor* field,
                                                  bool split) {
   return absl::StrCat("_impl_.", split ? "_split_->" : "", "_",
                       FieldName(field), "_cached_byte_size_");
 }

 // Note: A lot of libraries detect Any protos based on Descriptor::full_name()
 // while the two functions below use FileDescriptor::name(). In a sane world the
 // two approaches should be equivalent. But if you are dealing with descriptors
 // from untrusted sources, you might need to match semantics across libraries.
 bool IsAnyMessage(const FileDescriptor* descriptor);
 bool IsAnyMessage(const Descriptor* descriptor);

 bool IsWellKnownMessage(const FileDescriptor* descriptor);

 enum class GeneratedFileType : int { kPbH, kProtoH, kProtoStaticReflectionH };

 inline std::string IncludeGuard(const FileDescriptor* file,
                                 GeneratedFileType file_type,
                                 const Options& options) {
   // If we are generating a .pb.h file and the proto_h option is enabled, then
   // the .pb.h gets an extra suffix.
   std::string extension;
   switch (file_type) {
     case GeneratedFileType::kPbH:
       extension = ".pb.h";
       break;
     case GeneratedFileType::kProtoH:
       extension = ".proto.h";
       break;
     case GeneratedFileType::kProtoStaticReflectionH:
       extension = ".proto.static_reflection.h";
   }
   std::string filename_identifier =
       FilenameIdentifier(file->name() + extension);

   if (IsWellKnownMessage(file)) {
     // For well-known messages we need third_party/protobuf and net/proto2 to
     // have distinct include guards, because some source files include both and
     // both need to be defined (the third_party copies will be in the
     // google::protobuf_opensource namespace).
     return absl::StrCat(MacroPrefix(options), "_INCLUDED_",
                         filename_identifier);
   } else {
     // Ideally this case would use distinct include guards for opensource and
     // google3 protos also.  (The behavior of "first #included wins" is not
     // ideal).  But unfortunately some legacy code includes both and depends on
     // the identical include guards to avoid compile errors.
     //
     // We should clean this up so that this case can be removed.
     return absl::StrCat("GOOGLE_PROTOBUF_INCLUDED_", filename_identifier);
   }
 }

 // Returns the OptimizeMode for this file, furthermore it updates a status
 // bool if has_opt_codesize_extension is non-null. If this status bool is true
 // it means this file contains an extension that itself is defined as
 // optimized_for = CODE_SIZE.
 FileOptions_OptimizeMode GetOptimizeFor(const FileDescriptor* file,
                                         const Options& options,
                                         bool* has_opt_codesize_extension);
 inline FileOptions_OptimizeMode GetOptimizeFor(const FileDescriptor* file,
                                                const Options& options) {
   return GetOptimizeFor(file, options, nullptr);
 }
 inline bool NeedsEagerDescriptorAssignment(const FileDescriptor* file,
                                            const Options& options) {
   bool has_opt_codesize_extension;
   if (GetOptimizeFor(file, options, &has_opt_codesize_extension) ==
           FileOptions::CODE_SIZE &&
       has_opt_codesize_extension) {
     // If this filedescriptor contains an extension from another file which
     // is optimized_for = CODE_SIZE. We need to be careful in the ordering so
     // we eagerly build the descriptors in the dependencies before building
     // the descriptors of this file.
     return true;
   } else {
     // If we have a generated code based parser we never need eager
     // initialization of descriptors of our deps.
     return false;
   }
 }

 // This orders the messages in a .pb.cc as it's outputted by file.cc
 void FlattenMessagesInFile(const FileDescriptor* file,
                            std::vector<const Descriptor*>* result);
 inline std::vector<const Descriptor*> FlattenMessagesInFile(
     const FileDescriptor* file) {
   std::vector<const Descriptor*> result;
   FlattenMessagesInFile(file, &result);
   return result;
 }

 std::vector<const Descriptor*> TopologicalSortMessagesInFile(
     const FileDescriptor* file, MessageSCCAnalyzer& scc_analyzer);

 bool HasWeakFields(const Descriptor* desc, const Options& options);
 bool HasWeakFields(const FileDescriptor* desc, const Options& options);

 // Returns true if the "required" restriction check should be ignored for the
 // given field.
 inline static bool ShouldIgnoreRequiredFieldCheck(const FieldDescriptor* field,
                                                   const Options& options) {
   // Do not check "required" for lazily verified lazy fields.
   return IsLazilyVerifiedLazy(field, options);
 }

 struct MessageAnalysis {
   bool is_recursive = false;
   bool contains_cord = false;
   bool contains_extension = false;
   bool contains_required = false;
   bool contains_weak = false;  // Implicit weak as well.
 };

 // This class is used in FileGenerator, to ensure linear instead of
 // quadratic performance, if we do this per message we would get O(V*(V+E)).
 // Logically this is just only used in message.cc, but in the header for
 // FileGenerator to help share it.
 class PROTOC_EXPORT MessageSCCAnalyzer {
  public:
   explicit MessageSCCAnalyzer(const Options& options) : options_(options) {}

   MessageAnalysis GetSCCAnalysis(const SCC* scc);

   bool HasRequiredFields(const Descriptor* descriptor) {
     MessageAnalysis result = GetSCCAnalysis(GetSCC(descriptor));
     return result.contains_required || result.contains_extension;
   }
   bool HasWeakField(const Descriptor* descriptor) {
     MessageAnalysis result = GetSCCAnalysis(GetSCC(descriptor));
     return result.contains_weak;
   }
   const SCC* GetSCC(const Descriptor* descriptor) {
     return analyzer_.GetSCC(descriptor);
   }

  private:
   struct DepsGenerator {
     std::vector<const Descriptor*> operator()(const Descriptor* desc) const {
       std::vector<const Descriptor*> deps;
       for (int i = 0; i < desc->field_count(); i++) {
         if (desc->field(i)->message_type()) {
           deps.push_back(desc->field(i)->message_type());
         }
       }
       return deps;
     }
   };
   SCCAnalyzer<DepsGenerator> analyzer_;
   Options options_;
   absl::flat_hash_map<const SCC*, MessageAnalysis> analysis_cache_;
 };

 void ListAllFields(const Descriptor* d,
                    std::vector<const FieldDescriptor*>* fields);
 void ListAllFields(const FileDescriptor* d,
                    std::vector<const FieldDescriptor*>* fields);

 template <class T>
 void ForEachField(const Descriptor* d, T&& func) {
   for (int i = 0; i < d->nested_type_count(); i++) {
     ForEachField(d->nested_type(i), std::forward<T&&>(func));
   }
   for (int i = 0; i < d->extension_count(); i++) {
     func(d->extension(i));
   }
   for (int i = 0; i < d->field_count(); i++) {
     func(d->field(i));
   }
 }

 template <class T>
 void ForEachField(const FileDescriptor* d, T&& func) {
   for (int i = 0; i < d->message_type_count(); i++) {
     ForEachField(d->message_type(i), std::forward<T&&>(func));
   }
   for (int i = 0; i < d->extension_count(); i++) {
     func(d->extension(i));
   }
 }

 void ListAllTypesForServices(const FileDescriptor* fd,
                              std::vector<const Descriptor*>* types);

 // Whether this type should use the implicit weak feature for descriptor based
 // objects.
 //
 // This feature allows tree shaking within a single translation unit by
 // decoupling the messages from the TU-wide `file_default_instances` array.
 // This way there are no static initializers in the TU pointing to any part of
 // the generated classes and they can be GC'd by the linker.
 // Instead of direct use, we have two ways to weakly refer to the default
 // instances:
 //  - Each default instance is located on its own section, and we use a
 //    `&__start_section_name` pointer to access it. This is a reference that
 //    allows GC to happen. This step is used with dynamic linking.
 //  - We also allow merging all these sections at link time into the
 //    `pb_defaults` section. All surviving messages will be injected back into
 //    the `file_default_instances` when the runtime is initialized. This is
 //    useful when doing static linking and you want to avoid having an unbounded
 //    number of sections.
 //
 // Any object that gets GC'd will have a `nullptr` in the respective slot in the
 // `file_default_instances` array. The runtime will recognize this and will
 // dynamically generate the object if needed. This logic is in the
 // `GeneratedMessageFactory::GetPrototype`.  It will fall back to a
 // `DynamicMessage` for the missing objects.
 // This allows all of reflection to keep working normally, even for types that
 // were dropped. Note that dropping the _classes_ will not drop the descriptor
 // information. The messages are still going to be registered in the generated
 // `DescriptorPool` and will be available via normal `FindMessageTypeByName` and
 // friends.
 //
 // A "pin" is adding dependency edge in the graph for the GC.
 // The default instance and vtable of a message pin each other. If any one
 // lives, they both do. This is important. The default instance of the message
 // pins the vtable trivially by using it. The vtable pins the default instance
 // by having a StrongPointer into it from any of the virtual functions.
 //
 // All parent messages pin their children.
 // SPEED messages do this implicitly via the TcParseTable, which contain
 // pointers to the submessages.
 // CODE_SIZE messages explicitly add a pin via `StrongPointer` somewhere in
 // their codegen.
 // LITE messages do not participate at all in this feature.
 //
 // For extensions, the identifiers currently pin the extendee. The extended is
 // assumed to by pinned elsewhere since we already have an instance of it when
 // we call `.GetExtension` et al. The extension identifier itself is not
 // automatically pinned, so it has to be used to participate in the graph.
 // Registration of the extensions do not pin the extended or the extendee. At
 // registration time we will eagerly create a prototype object if one is
 // missing to insert in the extension table in ExtensionSet.
 //
 // For services, the TU unconditionally pins the request/response objects.
 // This is the status quo for simplicitly to avoid modifying the RPC layer. It
 // might be improved in the future.
 bool UsingImplicitWeakDescriptor(const FileDescriptor* file,
                                  const Options& options);

 // Generate the section name to be used for a data object when using implicit
 // weak descriptors. The prefix determines the kind of object and the section it
 // will be merged into afterwards.
 // See `UsingImplicitWeakDescriptor` above.
 std::string WeakDescriptorDataSection(absl::string_view prefix,
                                       const Descriptor* descriptor,
                                       int index_in_file_messages,
                                       const Options& options);

 // Section name to be used for the default instance for implicit weak descriptor
 // objects. See `UsingImplicitWeakDescriptor` above.
 inline std::string WeakDefaultInstanceSection(const Descriptor* descriptor,
                                               int index_in_file_messages,
                                               const Options& options) {
   return WeakDescriptorDataSection("def", descriptor, index_in_file_messages,
                                    options);
 }

 // Indicates whether we should use implicit weak fields for this file.
 bool UsingImplicitWeakFields(const FileDescriptor* file,
                              const Options& options);

 // Indicates whether to treat this field as implicitly weak.
 bool IsImplicitWeakField(const FieldDescriptor* field, const Options& options,
                          MessageSCCAnalyzer* scc_analyzer);

 inline std::string SimpleBaseClass(const Descriptor* desc,
                                    const Options& options) {
   // The only base class we have derived from `Message`.
   if (!HasDescriptorMethods(desc->file(), options)) return "";
   // We don't use the base class to be able to inject the weak descriptor pins.
   if (UsingImplicitWeakDescriptor(desc->file(), options)) return "";
   if (desc->extension_range_count() != 0) return "";
   // Don't use a simple base class if the field tracking is enabled. This
   // ensures generating all methods to track.
   if (options.field_listener_options.inject_field_listener_events) return "";
   if (desc->field_count() == 0) {
     return "ZeroFieldsBase";
   }
   // TODO: Support additional common message types with only one
   // or two fields
   return "";
 }

 inline bool HasSimpleBaseClass(const Descriptor* desc, const Options& options) {
   return !SimpleBaseClass(desc, options).empty();
 }

 inline bool HasSimpleBaseClasses(const FileDescriptor* file,
                                  const Options& options) {
   return internal::cpp::VisitDescriptorsInFileOrder(
       file, [&](const Descriptor* desc) {
         return HasSimpleBaseClass(desc, options);
       });
 }

 // Returns true if this message has a _tracker_ field.
 inline bool HasTracker(const Descriptor* desc, const Options& options) {
   return options.field_listener_options.inject_field_listener_events &&
          desc->file()->options().optimize_for() !=
              google::protobuf::FileOptions::LITE_RUNTIME &&
          !IsMapEntryMessage(desc);
 }

 // Returns true if this message needs an Impl_ struct for it's data.
 inline bool HasImplData(const Descriptor* desc, const Options& options) {
   return !HasSimpleBaseClass(desc, options);
 }

 // DO NOT USE IN NEW CODE! Use io::Printer directly instead. See b/242326974.
 //
 // Formatter is a functor class which acts as a closure around printer and
 // the variable map. It's much like printer->Print except it supports both named
 // variables that are substituted using a key value map and direct arguments. In
 // the format string $1$, $2$, etc... are substituted for the first, second, ...
 // direct argument respectively in the format call, it accepts both strings and
 // integers. The implementation verifies all arguments are used and are "first"
 // used in order of appearance in the argument list. For example,
 //
 // Format("return array[$1$];", 3) -> "return array[3];"
 // Format("array[$2$] = $1$;", "Bla", 3) -> FATAL error (wrong order)
 // Format("array[$1$] = $2$;", 3, "Bla") -> "array[3] = Bla;"
 //
 // The arguments can be used more than once like
 //
 // Format("array[$1$] = $2$;  // Index = $1$", 3, "Bla") ->
 //        "array[3] = Bla;  // Index = 3"
 //
 // If you use more arguments use the following style to help the reader,
 //
 // Format("int $1$() {\n"
 //        "  array[$2$] = $3$;\n"
 //        "  return $4$;"
 //        "}\n",
 //        funname, // 1
 //        idx,  // 2
 //        varname,  // 3
 //        retval);  // 4
 //
 // but consider using named variables. Named variables like $foo$, with some
 // identifier foo, are looked up in the map. One additional feature is that
 // spaces are accepted between the '$' delimiters, $ foo$ will
 // substitute to " bar" if foo stands for "bar", but in case it's empty
 // will substitute to "". Hence, for example,
 //
 // Format(vars, "$dllexport $void fun();") -> "void fun();"
 //                                            "__declspec(export) void fun();"
 //
 // which is convenient to prevent double, leading or trailing spaces.
 class PROTOC_EXPORT Formatter {
  public:
   explicit Formatter(io::Printer* printer) : printer_(printer) {}
   Formatter(io::Printer* printer,
             const absl::flat_hash_map<absl::string_view, std::string>& vars)
       : printer_(printer), vars_(vars) {}

   template <typename T>
   void Set(absl::string_view key, const T& value) {
     vars_[key] = ToString(value);
   }

   template <typename... Args>
   void operator()(const char* format, const Args&... args) const {
     printer_->FormatInternal({ToString(args)...}, vars_, format);
   }

   void Indent() const { printer_->Indent(); }
   void Outdent() const { printer_->Outdent(); }
   io::Printer* printer() const { return printer_; }

   class PROTOC_EXPORT ScopedIndenter {
    public:
     explicit ScopedIndenter(Formatter* format) : format_(format) {
       format_->Indent();
     }
     ~ScopedIndenter() { format_->Outdent(); }

    private:
     Formatter* format_;
   };

   PROTOBUF_NODISCARD ScopedIndenter ScopedIndent() {
     return ScopedIndenter(this);
   }
   template <typename... Args>
   PROTOBUF_NODISCARD ScopedIndenter ScopedIndent(const char* format,
                                                  const Args&&... args) {
     (*this)(format, static_cast<Args&&>(args)...);
     return ScopedIndenter(this);
   }

  private:
   io::Printer* printer_;
   absl::flat_hash_map<absl::string_view, std::string> vars_;

   // Convenience overloads to accept different types as arguments.
   static std::string ToString(absl::string_view s) { return std::string(s); }
   template <typename I, typename = typename std::enable_if<
                             std::is_integral<I>::value>::type>
   static std::string ToString(I x) {
     return absl::StrCat(x);
   }
   static std::string ToString(absl::Hex x) { return absl::StrCat(x); }
   static std::string ToString(const FieldDescriptor* d) {
     return Payload(d, GeneratedCodeInfo::Annotation::NONE);
   }
   static std::string ToString(const Descriptor* d) {
     return Payload(d, GeneratedCodeInfo::Annotation::NONE);
   }
   static std::string ToString(const EnumDescriptor* d) {
     return Payload(d, GeneratedCodeInfo::Annotation::NONE);
   }
   static std::string ToString(const EnumValueDescriptor* d) {
     return Payload(d, GeneratedCodeInfo::Annotation::NONE);
   }
   static std::string ToString(const OneofDescriptor* d) {
     return Payload(d, GeneratedCodeInfo::Annotation::NONE);
   }

   static std::string ToString(
       std::tuple<const FieldDescriptor*,
                  GeneratedCodeInfo::Annotation::Semantic>
           p) {
     return Payload(std::get<0>(p), std::get<1>(p));
   }
   static std::string ToString(
       std::tuple<const Descriptor*, GeneratedCodeInfo::Annotation::Semantic>
           p) {
     return Payload(std::get<0>(p), std::get<1>(p));
   }
   static std::string ToString(
       std::tuple<const EnumDescriptor*, GeneratedCodeInfo::Annotation::Semantic>
           p) {
     return Payload(std::get<0>(p), std::get<1>(p));
   }
   static std::string ToString(
       std::tuple<const EnumValueDescriptor*,
                  GeneratedCodeInfo::Annotation::Semantic>
           p) {
     return Payload(std::get<0>(p), std::get<1>(p));
   }
   static std::string ToString(
       std::tuple<const OneofDescriptor*,
                  GeneratedCodeInfo::Annotation::Semantic>
           p) {
     return Payload(std::get<0>(p), std::get<1>(p));
   }

   template <typename Descriptor>
   static std::string Payload(const Descriptor* descriptor,
                              GeneratedCodeInfo::Annotation::Semantic semantic) {
     std::vector<int> path;
     descriptor->GetLocationPath(&path);
     GeneratedCodeInfo::Annotation annotation;
     for (int index : path) {
       annotation.add_path(index);
     }
     annotation.set_source_file(descriptor->file()->name());
     annotation.set_semantic(semantic);
     return annotation.SerializeAsString();
   }
 };

 template <typename T>
 std::string FieldComment(const T* field, const Options& options) {
   if (options.strip_nonfunctional_codegen) {
     return field->name();
   }
   // Print the field's (or oneof's) proto-syntax definition as a comment.
   // We don't want to print group bodies so we cut off after the first
   // line.
   DebugStringOptions debug_options;
   debug_options.elide_group_body = true;
   debug_options.elide_oneof_body = true;

   for (absl::string_view chunk :
        absl::StrSplit(field->DebugStringWithOptions(debug_options), '\n')) {
     return std::string(chunk);
   }

   return "<unknown>";
 }

 template <class T>
 void PrintFieldComment(const Formatter& format, const T* field,
                        const Options& options) {
   format("// $1$\n", FieldComment(field, options));
 }

 class PROTOC_EXPORT NamespaceOpener {
  public:
   explicit NamespaceOpener(
       io::Printer* p,
       io::Printer::SourceLocation loc = io::Printer::SourceLocation::current())
       : p_(p), loc_(loc) {}

   explicit NamespaceOpener(
       const Formatter& format,
       io::Printer::SourceLocation loc = io::Printer::SourceLocation::current())
       : NamespaceOpener(format.printer(), loc) {}

   NamespaceOpener(
       absl::string_view name, const Formatter& format,
       io::Printer::SourceLocation loc = io::Printer::SourceLocation::current())
       : NamespaceOpener(name, format.printer(), loc) {}

   NamespaceOpener(
       absl::string_view name, io::Printer* p,
       io::Printer::SourceLocation loc = io::Printer::SourceLocation::current())
       : NamespaceOpener(p, loc) {
     ChangeTo(name, loc);
   }

   ~NamespaceOpener() { ChangeTo("", loc_); }

   void ChangeTo(
       absl::string_view name,
       io::Printer::SourceLocation loc = io::Printer::SourceLocation::current());

  private:
   io::Printer* p_;
   io::Printer::SourceLocation loc_;
   std::vector<std::string> name_stack_;
 };

 void GenerateUtf8CheckCodeForString(const FieldDescriptor* field,
                                     const Options& options, bool for_parse,
                                     absl::string_view parameters,
                                     const Formatter& format);

 void GenerateUtf8CheckCodeForCord(const FieldDescriptor* field,
                                   const Options& options, bool for_parse,
                                   absl::string_view parameters,
                                   const Formatter& format);

 void GenerateUtf8CheckCodeForString(io::Printer* p,
                                     const FieldDescriptor* field,
                                     const Options& options, bool for_parse,
                                     absl::string_view parameters);

 void GenerateUtf8CheckCodeForCord(io::Printer* p, const FieldDescriptor* field,
                                   const Options& options, bool for_parse,
                                   absl::string_view parameters);

 inline bool ShouldGenerateExternSpecializations(const Options& options) {
   // For OSS we omit the specializations to reduce codegen size.
   // Some compilers can't handle that much input in a single translation unit.
   // These specializations are just a link size optimization and do not affect
   // correctness or performance, so it is ok to omit them.
   return !options.opensource_runtime;
 }

 struct OneOfRangeImpl {
   struct Iterator {
     using iterator_category = std::forward_iterator_tag;
     using value_type = const OneofDescriptor*;
     using difference_type = int;

     value_type operator*() { return descriptor->oneof_decl(idx); }

     friend bool operator==(const Iterator& a, const Iterator& b) {
       ABSL_DCHECK(a.descriptor == b.descriptor);
       return a.idx == b.idx;
     }
     friend bool operator!=(const Iterator& a, const Iterator& b) {
       return !(a == b);
     }

     Iterator& operator++() {
       idx++;
       return *this;
     }

     int idx;
     const Descriptor* descriptor;
   };

   Iterator begin() const { return {0, descriptor}; }
   Iterator end() const {
     return {descriptor->real_oneof_decl_count(), descriptor};
   }

   const Descriptor* descriptor;
 };

 inline OneOfRangeImpl OneOfRange(const Descriptor* desc) { return {desc}; }

 // Strips ".proto" or ".protodevel" from the end of a filename.
 PROTOC_EXPORT std::string StripProto(absl::string_view filename);

 bool HasMessageFieldOrExtension(const Descriptor* desc);

 // Generates a vector of substitutions for use with Printer::WithVars that
 // contains annotated accessor names for a particular field.
 //
 // Each substitution will be named `absl::StrCat(prefix, "name")`, and will
 // be annotated with `field`.
 std::vector<io::Printer::Sub> AnnotatedAccessors(
     const FieldDescriptor* field, absl::Span<const absl::string_view> prefixes,
     absl::optional<google::protobuf::io::AnnotationCollector::Semantic> semantic =
         absl::nullopt);

 // Check whether `file` represents the .proto file FileDescriptorProto and
 // friends. This file needs special handling because it must be usable during
 // dynamic initialization.
 bool IsFileDescriptorProto(const FileDescriptor* file, const Options& options);

 // Determine if we should generate a class for the descriptor.
 // Some descriptors, like some map entries, are not represented as a generated
 // class.
 bool ShouldGenerateClass(const Descriptor* descriptor, const Options& options);


 // Determine if we need a PostLoopHandler function to inject into TcParseTable's
 // ParseLoop.
 // If this returns true, the parse table generation will use
 // `&ClassName::PostLoopHandler` which should be a static function of the right
 // signature.
 bool NeedsPostLoopHandler(const Descriptor* descriptor, const Options& options);

 }  // namespace cpp
 }  // namespace compiler
 }  // namespace protobuf
 }  // namespace google

 #include "google/protobuf/port_undef.inc"

 #endif  // GOOGLE_PROTOBUF_COMPILER_CPP_HELPERS_H__