| # Copyright 2022 Google LLC |
| # |
| # Licensed under the Apache License, Version 2.0 (the "License"); |
| # you may not use this file except in compliance with the License. |
| # You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| |
| """Build rules to create cc_library that implements the InGrammar domain for a |
| given grammar from an ANTLRv4 grammar specification.""" |
| |
| load("@rules_cc//cc:cc_library.bzl", "cc_library") |
| |
| def cc_fuzztest_grammar_library(name, srcs, top_level_rule = None, insert_whitespace = False): |
| """Generates the C++ library corresponding to an antlr4 grammar specification. |
| |
| Args: |
| |
| name: The name of the package to use for the cc_library. For example: |
| `"json_grammar"`. |
| srcs: The grammar specification files in ANTRLv4 format. For example: |
| `["json.g4"]`. |
| top_level_rule: The top level rule of the grammar that we use to generate |
| sentences. It will also be used in the generated domain name. For |
| example, if you set `top_level_rule="json"`, the generated domain name |
| will be `InJsonDomain` and it generates strings starting from the rule |
| `json` in your grammar file. |
| insert_whitespace: False by default. If set to True, the codegen will deterministically |
| insert a single whitespace between tokens/subrules in applicable rules. This |
| is useful when the original ANTLR grammar skips whitespaces. Inserting |
| whitespaces can help the lexer disambiguate certain tokens like keywords |
| vs identifiers. |
| """ |
| |
| output_file_name = name + ".h" |
| cmd = "$(location @com_google_fuzztest//tools:grammar_domain_code_generator)" + \ |
| " --output_header_file_path " + "$(@D)/" + output_file_name + \ |
| (" --insert_whitespace" if insert_whitespace else " --noinsert_whitespace") + \ |
| " --input_grammar_files " + "`echo $(SRCS) | tr ' ' ','`" |
| if top_level_rule: |
| cmd += " --top_level_rule " + top_level_rule |
| |
| native.genrule( |
| name = name + "_source", |
| srcs = srcs, |
| outs = [output_file_name], |
| cmd = cmd, |
| heuristic_label_expansion = False, |
| tools = ["@com_google_fuzztest//tools:grammar_domain_code_generator"], |
| ) |
| cc_library( |
| name = name, |
| hdrs = [output_file_name], |
| deps = ["@com_google_fuzztest//fuzztest/internal/domains:in_grammar_impl"], |
| ) |