summaryrefslogtreecommitdiff
path: root/mesonbuild/modules
diff options
context:
space:
mode:
author: Dylan Baker <dylan@pnwbakers.com> 2024-07-23 09:40:12 -0700
committer: Dylan Baker <dylan@pnwbakers.com> 2025-10-24 22:20:49 -0700
commit: 6aefc92c33f7bef17c338aa3e456dc45ca41058a (patch)
tree: fce85244140e726204387e380fd5b9f29c2c24fa /mesonbuild/modules
parent: f4650db5b06371eeb37005245366325723eadf9e (diff)
download: meson-6aefc92c33f7bef17c338aa3e456dc45ca41058a.tar.gz
modules/codegen: Add wrapper for lex/flex/reflex
This module is a bit of a dumping ground for code generators, particularly ones that are important and non-trivial to wrap, either due to multiple implementations, major command line changes, or complex outputs (such as those that may output a directory structure). The initially provided method is for lex. It provides a simple wrapper that handles win_flex, reflex, flex, and generic lex.
Diffstat (limited to 'mesonbuild/modules')
-rw-r--r-- mesonbuild/modules/codegen.py | 274
1 files changed, 274 insertions, 0 deletions
diff --git a/mesonbuild/modules/codegen.py b/mesonbuild/modules/codegen.py
new file mode 100644
index 000000000..b52f36f6d
--- /dev/null
+++ b/mesonbuild/modules/codegen.py
@@ -0,0 +1,274 @@
+# SPDX-License-Identifier: Apache-2.0
+# Copyright © 2024-2025 Intel Corporation
+
+from __future__ import annotations
+import dataclasses
+import os
+import typing as T
+
+from . import ExtensionModule, ModuleInfo
+from ..build import CustomTarget, CustomTargetIndex, GeneratedList
+from ..compilers.compilers import lang_suffixes
+from ..interpreter.interpreterobjects import extract_required_kwarg
+from ..interpreter.type_checking import NoneType, REQUIRED_KW, DISABLER_KW, NATIVE_KW
+from ..interpreterbase import (
+ ContainerTypeInfo, ObjectHolder, KwargInfo, typed_pos_args, typed_kwargs,
+ noPosargs, noKwargs, disablerIfNotFound, InterpreterObject
+)
+from ..mesonlib import File, MesonException, Popen_safe
+from ..programs import ExternalProgram, NonExistingExternalProgram
+from ..utils.core import HoldableObject
+from .. import mlog
+
if T.TYPE_CHECKING:
    # Everything in this branch exists only for static type checkers; none
    # of it is imported or defined at runtime.
    from typing_extensions import Literal, TypeAlias, TypedDict

    from . import ModuleState
    from .._typing import ImmutableListProtocol
    from ..build import Executable
    from ..interpreter import Interpreter
    from ..interpreter.kwargs import ExtractRequired
    from ..interpreterbase import TYPE_var, TYPE_kwargs
    from ..mesonlib import MachineChoice
    from ..programs import OverrideProgram

    # Any of the program kinds a code generator may wrap.
    Program: TypeAlias = T.Union[Executable, ExternalProgram, OverrideProgram]

    # Names of the lex implementations this module knows how to drive.
    LexImpls = Literal['lex', 'flex', 'reflex', 'win_flex']

    class LexGenerateKwargs(TypedDict):

        """Keyword arguments accepted by ``codegen.lex.generate``."""

        # Extra arguments added to the lexer command line before the input.
        args: T.List[str]
        # Explicit name of the generated source file, or None for the default.
        source: T.Optional[str]
        # Name of an additional header output, if one is wanted.
        header: T.Optional[str]
        # Name of an additional tables output, if one is wanted.
        table: T.Optional[str]
        # Selects @PLAINNAME@ instead of @BASENAME@ for the default output name.
        plainname: bool

    class FindLexKwargs(ExtractRequired):

        """Keyword arguments accepted by ``codegen.lex``."""

        # Per-implementation version constraints handed to the program lookup.
        lex_version: T.List[str]
        flex_version: T.List[str]
        reflex_version: T.List[str]
        win_flex_version: T.List[str]
        # Implementations to try, in order; empty means "use the defaults".
        implementations: T.List[LexImpls]
        # Machine the lexer program is looked up for.
        native: MachineChoice
+
+
def is_subset_validator(choices: T.Set[str]) -> T.Callable[[T.List[str]], T.Optional[str]]:
    """Build a validator that accepts only lists drawn from ``choices``.

    :param choices: the set of permitted values
    :return: a callable that takes the list to check and returns ``None``
        when every element is permitted, or otherwise a message naming the
        valid members and the offending ones (both sorted)
    """

    def inner(check: T.List[str]) -> T.Optional[str]:
        unexpected = set(check).difference(choices)
        # Guard clause: nothing outside of ``choices`` means the value is fine.
        if not unexpected:
            return None
        valid = ', '.join(sorted(choices))
        invalid = ', '.join(sorted(unexpected))
        return f"valid members are '{valid}', not '{invalid}'"

    return inner
+
+
@dataclasses.dataclass
class _CodeGenerator(HoldableObject):

    """Common state for a wrapped code generator program.

    Stores the name the generator is known by, the program that implements
    it, and the arguments that always follow the program on its command line.
    """

    name: str
    program: Program
    arguments: ImmutableListProtocol[str] = dataclasses.field(default_factory=list)

    def command(self) -> T.List[T.Union[Program, str]]:
        """Return a new list holding the program followed by its arguments."""
        # The casts only reconcile the element types for the type checker;
        # concatenation produces a fresh list, so callers may append to it.
        head = T.cast('T.List[T.Union[Program, str]]', [self.program])
        tail = T.cast('T.List[T.Union[Program, str]]', self.arguments)
        return head + tail

    def found(self) -> bool:
        """Report whether the wrapped program was found."""
        return self.program.found()
+
+
@dataclasses.dataclass
class LexGenerator(_CodeGenerator):

    """Code generator for a lex implementation; adds nothing to its base."""
+
+
class LexHolder(ObjectHolder[LexGenerator]):

    """Interpreter holder exposing a LexGenerator's methods to build files."""

    @noPosargs
    @noKwargs
    @InterpreterObject.method('implementation')
    def implementation_method(self, args: T.List[TYPE_var], kwargs: TYPE_kwargs) -> str:
        """Return the name of the lex implementation held by this object."""
        # This must be registered under its own name: registering it as
        # 'generate' collides with generate_method below.
        return self.held_object.name

    @noPosargs
    @noKwargs
    @InterpreterObject.method('found')
    def found_method(self, args: T.List[TYPE_var], kwargs: TYPE_kwargs) -> bool:
        """Return whether the held lex program was found."""
        return self.held_object.found()

    @typed_pos_args('codegen.lex.generate', (str, File, GeneratedList, CustomTarget, CustomTargetIndex))
    @typed_kwargs(
        'codegen.lex.generate',
        KwargInfo('args', ContainerTypeInfo(list, str), default=[], listify=True),
        KwargInfo('source', (str, NoneType)),
        KwargInfo('header', (str, NoneType)),
        KwargInfo('table', (str, NoneType)),
        KwargInfo('plainname', bool, default=False),
    )
    @InterpreterObject.method('generate')
    def generate_method(self, args: T.Tuple[T.Union[str, File, GeneratedList, CustomTarget, CustomTargetIndex]], kwargs: LexGenerateKwargs) -> CustomTarget:
        """Create a custom target that runs the lexer generator on one input.

        :param args: a single positional input; a string, a File, or a
            generated object with exactly one output
        :param kwargs: see the ``typed_kwargs`` declaration above
        :return: the CustomTarget, which is also registered with the interpreter
        :raises MesonException: if no lex implementation was found, if a
            generated input has other than one output, or if flex is asked
            for C++ output and no C++ compiler or ``FlexLexer.h`` is available
        """
        if not self.held_object.found():
            raise MesonException('Attempted to call generate without finding a lex implementation')

        lex_input = self.interpreter.source_strings_to_files([args[0]])[0]
        if isinstance(lex_input, File):
            is_cpp = lex_input.endswith(".ll")
            name = os.path.splitext(lex_input.fname)[0]
        else:
            gen_input = lex_input.get_outputs()
            if len(gen_input) != 1:
                raise MesonException('codegen.lex.generate: generated type inputs must have exactly one output, index into them to select the correct input')
            is_cpp = gen_input[0].endswith('.ll')
            name = os.path.splitext(gen_input[0])[0]
        # Only the file name, without directories, is used in the target name.
        name = os.path.basename(name)

        # If an explicit source was given, use that to determine whether the
        # user expects this to be a C or C++ source.
        if kwargs['source'] is not None:
            _, dot, ext = kwargs['source'].rpartition('.')
            # A name without any '.' has no extension to inspect; keep the
            # guess derived from the input instead of failing with IndexError.
            if dot:
                is_cpp = ext in lang_suffixes['cpp']

        for_machine = self.held_object.program.for_machine

        # Flex uses FlexLexer.h for C++ code
        if is_cpp and self.held_object.name in {'flex', 'win_flex'}:
            try:
                comp = self.interpreter.environment.coredata.compilers[for_machine]['cpp']
            except KeyError:
                raise MesonException(f"Could not find a C++ compiler for {for_machine} to search for FlexLexer.h")
            found, _ = comp.has_header('FlexLexer.h', '', self.interpreter.environment)
            if not found:
                raise MesonException('Could not find FlexLexer.h, which is required for Flex with C++')

        if kwargs['source'] is None:
            outputs = ['@{}@.{}'.format(
                'PLAINNAME' if kwargs['plainname'] else 'BASENAME',
                'cpp' if is_cpp else 'c')]
        else:
            outputs = [kwargs['source']]

        # command() returns a fresh list, so extending it here does not
        # modify the held generator.
        command = self.held_object.command()
        if kwargs['header'] is not None:
            outputs.append(kwargs['header'])
            # The output was just appended, so its index is the last one.
            command.append(f'--header-file=@OUTPUT{len(outputs) - 1}@')
        if kwargs['table'] is not None:
            outputs.append(kwargs['table'])
            command.append(f'--tables-file=@OUTPUT{len(outputs) - 1}@')
        command.extend(kwargs['args'])
        # Flex, at least, seems to require that input be the last argument given
        command.append('@INPUT@')

        target = CustomTarget(
            f'codegen-lex-{name}-{for_machine.get_lower_case_name()}',
            self.interpreter.subdir,
            self.interpreter.subproject,
            self.interpreter.environment,
            command,
            [lex_input],
            outputs,
            backend=self.interpreter.backend,
            # The doubled braces leave a literal '{}' in the description.
            description='Generating lexer {{}} with {}'.format(self.held_object.name),
        )
        self.interpreter.add_target(target.name, target)

        return target
+
+
class CodeGenModule(ExtensionModule):

    """Module with helpers for codegen wrappers."""

    INFO = ModuleInfo('codegen', '1.10.0', unstable=True)

    def __init__(self, interpreter: Interpreter) -> None:
        super().__init__(interpreter)
        self.methods.update({
            'lex': self.lex_method,
        })

    @noPosargs
    @typed_kwargs(
        'codegen.lex',
        KwargInfo('lex_version', ContainerTypeInfo(list, str), default=[], listify=True),
        KwargInfo('flex_version', ContainerTypeInfo(list, str), default=[], listify=True),
        KwargInfo('reflex_version', ContainerTypeInfo(list, str), default=[], listify=True),
        KwargInfo('win_flex_version', ContainerTypeInfo(list, str), default=[], listify=True),
        KwargInfo(
            'implementations',
            ContainerTypeInfo(list, str),
            default=[],
            listify=True,
            validator=is_subset_validator({'lex', 'flex', 'reflex', 'win_flex'})
        ),
        REQUIRED_KW,
        DISABLER_KW,
        NATIVE_KW
    )
    @disablerIfNotFound
    def lex_method(self, state: ModuleState, args: T.Tuple, kwargs: FindLexKwargs) -> LexGenerator:
        """Find a lex implementation and wrap it in a LexGenerator.

        Candidates are tried in order, either the ``implementations`` given
        by the caller or a default list, and the first usable one wins.

        :param state: the module state of the calling build file
        :param args: unused; the method takes no positional arguments
        :param kwargs: see the ``typed_kwargs`` declaration above
        :return: a LexGenerator; it wraps a not-found program when the
            feature is disabled, or when nothing was found and the lookup
            is not required
        :raises MesonException: if nothing was found and the lookup is required
        """
        disabled, required, feature = extract_required_kwarg(kwargs, state.subproject)
        if disabled:
            mlog.log('generator lex skipped: feature', mlog.bold(feature), 'disabled')
            return LexGenerator('lex', NonExistingExternalProgram('lex'))

        machine = state.environment.machines[kwargs['native']]

        names: T.List[LexImpls] = []
        if kwargs['implementations']:
            names = kwargs['implementations']
        else:
            assert machine is not None, 'for mypy'
            # win_flex is tried first when the selected machine is Windows.
            if machine.system == 'windows':
                names.append('win_flex')
            names.extend(['flex', 'reflex', 'lex'])

        versions: T.Mapping[str, T.List[str]] = {
            'lex': kwargs['lex_version'],
            'flex': kwargs['flex_version'],
            'reflex': kwargs['reflex_version'],
            'win_flex': kwargs['win_flex_version']
        }

        for name in names:
            prog = state.find_program(
                name, wanted=versions[name], for_machine=kwargs['native'], required=False)
            if prog.found():
                # If you're building reflex as a subproject, we consider that you
                # know what you're doing.
                if name == 'reflex' and isinstance(prog, ExternalProgram):
                    # there are potentially 3 programs called "reflex":
                    # 1. https://invisible-island.net/reflex/, an alternate fork
                    #    of the original flex, this is supported
                    # 2. https://www.genivia.com/doc/reflex/html/, an
                    #    alternative implementation for generating C++ scanners.
                    #    Not supported
                    # 3. https://github.com/cespare/reflex, which is not a lex
                    #    implementation at all, but a file watcher
                    _, out, err = Popen_safe(prog.get_command() + ['--version'])
                    if 'unknown flag: --version' in err:
                        mlog.debug('Skipping cespare/reflex, which is not a lexer and is not supported')
                        continue
                    if 'Written by Robert van Engelen' in out:
                        mlog.debug('Skipping RE/flex, which is not compatible with POSIX lex.')
                        continue
                break
        else:
            # The loop ended without a break: no candidate was usable.
            if required:
                # Build one message string; passing the fragments as separate
                # positional arguments makes the exception render as a tuple.
                tried = ', '.join(names)
                raise MesonException.from_node(
                    f'Could not find a lex implementation. Tried: {tried}',
                    node=state.current_node)
            # ``name`` and ``prog`` refer to the last candidate tried.
            return LexGenerator(name, prog)

        lex_args: T.List[str] = []
        # This option allows compiling with MSVC
        # https://github.com/lexxmark/winflexbison/blob/master/UNISTD_ERROR.readme
        if prog.name == 'win_flex' and machine.is_windows():
            lex_args.append('--wincompat')
        lex_args.extend(['-o', '@OUTPUT0@'])
        return LexGenerator(name, prog, T.cast('ImmutableListProtocol[str]', lex_args))
+
+
def initialize(interpreter: Interpreter) -> CodeGenModule:
    """Create the codegen module for ``interpreter``.

    Registers LexHolder as the holder for LexGenerator objects on the
    interpreter before constructing the module.

    :param interpreter: the interpreter the module is attached to
    :return: the new CodeGenModule instance
    """
    interpreter.append_holder_map(LexGenerator, LexHolder)
    module = CodeGenModule(interpreter)
    return module