gen_backend_stubs.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557
  1. import pathlib
  2. import argparse
  3. import os
  4. import yaml
  5. import re
  6. from collections import namedtuple, Counter, defaultdict
  7. from typing import List, Dict, Union, Sequence, Optional
  8. from torchgen.gen import (
  9. get_grouped_native_functions,
  10. parse_native_yaml,
  11. NamespaceHelper,
  12. )
  13. from torchgen.model import (
  14. BackendIndex,
  15. BackendMetadata,
  16. DispatchKey,
  17. NativeFunction,
  18. NativeFunctionsGroup,
  19. OperatorName,
  20. )
  21. from torchgen.selective_build.selector import SelectiveBuilder
  22. from torchgen.utils import Target, concatMap, context, YamlLoader, FileManager
  23. from torchgen.context import native_function_manager
  24. from torchgen.code_template import CodeTemplate
  25. import torchgen.dest as dest
  26. import torchgen.api.dispatcher as dispatcher
  27. from torchgen.api.types import DispatcherSignature
  28. # Parses the external backend's yaml, and adds a new BackendIndex for the backend's dispatch key.
  29. # Returns a Tuple of (backend_key, autograd_key, cpp_namespace, updated BackendIndex mapping)
  30. ParsedExternalYaml = namedtuple(
  31. "ParsedExternalYaml",
  32. ["backend_key", "autograd_key", "class_name", "cpp_namespace", "backend_indices"],
  33. )
  34. def parse_backend_yaml(
  35. backend_yaml_path: str,
  36. grouped_native_functions: Sequence[Union[NativeFunction, NativeFunctionsGroup]],
  37. backend_indices: Dict[DispatchKey, BackendIndex],
  38. ) -> ParsedExternalYaml:
  39. native_functions_map: Dict[OperatorName, NativeFunction] = {
  40. f.func.name: f
  41. for f in concatMap(
  42. lambda f: [f] if isinstance(f, NativeFunction) else list(f.functions()),
  43. grouped_native_functions,
  44. )
  45. }
  46. with open(backend_yaml_path, "r") as f:
  47. yaml_values = yaml.load(f, Loader=YamlLoader)
  48. assert isinstance(yaml_values, dict)
  49. valid_keys = [
  50. "backend",
  51. "class_name",
  52. "cpp_namespace",
  53. "extra_headers",
  54. "supported",
  55. "autograd",
  56. "full_codegen",
  57. ]
  58. backend = yaml_values.pop("backend", None)
  59. assert backend is not None, 'You must provide a value for "backend"'
  60. class_name = yaml_values.pop("class_name", None)
  61. cpp_namespace = yaml_values.pop("cpp_namespace", None)
  62. assert cpp_namespace is not None, 'You must provide a value for "cpp_namespace"'
  63. # Mostly just defaulting to false to stick with LazyTensor convention.
  64. use_out_as_primary = yaml_values.pop("use_out_as_primary", False)
  65. assert isinstance(
  66. use_out_as_primary, bool
  67. ), f"You must provide either True or False for use_out_as_primary. Provided: {use_out_as_primary}"
  68. use_device_guard = yaml_values.pop("device_guard", False)
  69. assert isinstance(
  70. use_device_guard, bool
  71. ), f"You must provide either True or False for device_guard. Provided: {use_device_guard}"
  72. supported = yaml_values.pop("supported", [])
  73. if supported is None:
  74. supported = [] # Allow an empty list of supported ops
  75. assert isinstance(
  76. supported, list
  77. ), f'expected "supported" to be a list, but got: {supported} (of type {type(supported)})'
  78. supported_autograd = yaml_values.pop("autograd", [])
  79. assert isinstance(
  80. supported_autograd, list
  81. ), f'expected "autograd" to be a list, but got: {supported_autograd}'
  82. # full_codegen is ignored by parse_backend_yaml, and re-parsed in gen_lazy_tensor.py
  83. full_codegen = yaml_values.pop("full_codegen", [])
  84. supported.extend(full_codegen)
  85. assert (
  86. len(yaml_values.keys()) == 0
  87. ), f'{backend_yaml_path} contains unexpected keys: {", ".join(yaml_values.keys())}. \
  88. Only the following keys are supported: {", ".join(valid_keys)}'
  89. def create_backend_index(
  90. backend_ops: List[str],
  91. dispatch_key: DispatchKey,
  92. *,
  93. use_out_as_primary: bool,
  94. use_device_guard: bool,
  95. ) -> BackendIndex:
  96. metadata: Dict[OperatorName, BackendMetadata] = {}
  97. for op in backend_ops:
  98. op_name = OperatorName.parse(op)
  99. assert (
  100. op_name in native_functions_map
  101. ), f"Found an invalid operator name: {op_name}"
  102. # See Note [External Backends Follow Dispatcher API]
  103. kernel_name = dispatcher.name(native_functions_map[op_name].func)
  104. # TODO: allow structured external backends later.
  105. m = BackendMetadata(kernel=kernel_name, structured=False)
  106. metadata[op_name] = m
  107. return BackendIndex(
  108. dispatch_key=dispatch_key,
  109. use_out_as_primary=use_out_as_primary,
  110. external=True,
  111. device_guard=use_device_guard,
  112. index=metadata,
  113. )
  114. backend_key: Optional[DispatchKey] = None
  115. if len(supported) > 0:
  116. with context(
  117. lambda: f'The provided value for "backend" must be a valid DispatchKey, but got {backend}.'
  118. ):
  119. backend_key = DispatchKey.parse(backend)
  120. backend_idx = create_backend_index(
  121. supported,
  122. backend_key,
  123. use_out_as_primary=use_out_as_primary,
  124. use_device_guard=use_device_guard,
  125. )
  126. assert backend_key not in backend_indices
  127. backend_indices[backend_key] = backend_idx
  128. autograd_key: Optional[DispatchKey] = None
  129. if len(supported_autograd) > 0:
  130. with context(
  131. lambda: f'The "autograd" key was specified, which indicates that you would like to override \
  132. the behavior of autograd for some operators on your backend. However "Autograd{backend}" is not a valid DispatchKey.'
  133. ):
  134. autograd_key = DispatchKey.parse(f"Autograd{backend}")
  135. autograd_idx = create_backend_index(
  136. supported_autograd,
  137. autograd_key,
  138. use_out_as_primary=use_out_as_primary,
  139. use_device_guard=use_device_guard,
  140. )
  141. assert autograd_key not in backend_indices
  142. backend_indices[autograd_key] = autograd_idx
  143. for g in grouped_native_functions:
  144. if isinstance(g, NativeFunction):
  145. forward_kernels = (
  146. []
  147. if backend_key is None
  148. else [
  149. m
  150. for m in [backend_indices[backend_key].get_kernel(g)]
  151. if m is not None
  152. ]
  153. )
  154. backward_kernels = (
  155. []
  156. if autograd_key is None
  157. else [
  158. m
  159. for m in [backend_indices[autograd_key].get_kernel(g)]
  160. if m is not None
  161. ]
  162. )
  163. else:
  164. forward_kernels = (
  165. []
  166. if backend_key is None
  167. else [
  168. m
  169. for m in [
  170. backend_indices[backend_key].get_kernel(f)
  171. for f in g.functions()
  172. ]
  173. if m is not None
  174. ]
  175. )
  176. backward_kernels = (
  177. []
  178. if autograd_key is None
  179. else [
  180. m
  181. for m in [
  182. backend_indices[autograd_key].get_kernel(f)
  183. for f in g.functions()
  184. ]
  185. if m is not None
  186. ]
  187. )
  188. forward_kernels = [f for f in forward_kernels if f is not None]
  189. backward_kernels = [f for f in backward_kernels if f is not None]
  190. assert (
  191. len(forward_kernels) == 0 or len(backward_kernels) == 0
  192. ), f'Currently, all variants of an op must either be registered to a backend key, or to a backend\'s \
  193. autograd key. They cannot be mix and matched. If this is something you need, feel free to create an issue! \
  194. {forward_kernels[0].kernel} is listed under "supported", but {backward_kernels[0].kernel} is listed under "autograd".'
  195. return ParsedExternalYaml(
  196. backend_key, autograd_key, class_name, cpp_namespace, backend_indices
  197. )
  198. def error_on_missing_kernels(
  199. native_functions: Sequence[NativeFunction],
  200. backend_indices: Dict[DispatchKey, BackendIndex],
  201. backend_key: DispatchKey,
  202. autograd_key: Optional[DispatchKey],
  203. class_name: str,
  204. kernel_defn_file_path: str,
  205. full_codegen: Optional[List[OperatorName]] = None,
  206. ) -> None:
  207. try:
  208. with open(kernel_defn_file_path, "r") as f:
  209. backend_defns = f.read()
  210. except IOError:
  211. raise AssertionError(
  212. f"Unable to read from the specified impl_path file: {kernel_defn_file_path}"
  213. )
  214. if full_codegen is None:
  215. full_codegen = []
  216. expected_backend_op_names: List[OperatorName] = (
  217. list(backend_indices[backend_key].index.keys()) + []
  218. if autograd_key is None
  219. else list(backend_indices[autograd_key].index.keys())
  220. )
  221. expected_backend_native_funcs: List[NativeFunction] = [
  222. f
  223. for f in native_functions
  224. if f.func.name in expected_backend_op_names and f.func.name not in full_codegen
  225. ]
  226. expected_backend_kernel_name_counts: Dict[str, List[NativeFunction]] = defaultdict(
  227. list
  228. )
  229. for native_f in expected_backend_native_funcs:
  230. expected_backend_kernel_name_counts[dispatcher.name(native_f.func)].append(
  231. native_f
  232. )
  233. kernel_defn_regex = rf"{class_name}::([\w\d]*)\([^\)]*\)\s*{{"
  234. actual_backend_kernel_name_counts = Counter(
  235. re.findall(kernel_defn_regex, backend_defns)
  236. )
  237. missing_kernels_err_msg = ""
  238. for expected_name, funcs in expected_backend_kernel_name_counts.items():
  239. expected_overload_count = len(funcs)
  240. actual_overload_count = actual_backend_kernel_name_counts[expected_name]
  241. if expected_overload_count != actual_overload_count:
  242. def create_decl(f: NativeFunction) -> str:
  243. with native_function_manager(f):
  244. return DispatcherSignature.from_schema(f.func).decl()
  245. expected_schemas_str = "\n".join([create_decl(f) for f in funcs])
  246. missing_kernels_err_msg += f"""
  247. {class_name} is missing a kernel definition for {expected_name}. We found {actual_overload_count} kernel(s) with that name,
  248. but expected {expected_overload_count} kernel(s). The expected function schemas for the missing operator are:
  249. {expected_schemas_str}
  250. """
  251. assert missing_kernels_err_msg == "", missing_kernels_err_msg
  252. def main() -> None:
  253. parser = argparse.ArgumentParser(description="Generate backend stub files")
  254. parser.add_argument(
  255. "-s",
  256. "--source_yaml",
  257. help="path to source yaml file containing operator external definitions",
  258. )
  259. parser.add_argument("-o", "--output_dir", help="output directory")
  260. parser.add_argument("--dry_run", type=bool, default=False, help="output directory")
  261. parser.add_argument(
  262. "--impl_path",
  263. type=str,
  264. default=None,
  265. help="path to the source C++ file containing kernel definitions",
  266. )
  267. options = parser.parse_args()
  268. run(options.source_yaml, options.output_dir, options.dry_run, options.impl_path)
  269. def gen_dispatchkey_nativefunc_headers(
  270. fm: FileManager,
  271. class_name: str,
  272. cpp_namespace: str,
  273. backend_indices: Dict[DispatchKey, BackendIndex],
  274. grouped_native_functions: Sequence[Union[NativeFunction, NativeFunctionsGroup]],
  275. backend_dispatch_key: DispatchKey,
  276. autograd_dispatch_key: Optional[DispatchKey],
  277. backend_name: str = "",
  278. ) -> None:
  279. assert class_name is not None
  280. generated_comment = (
  281. "Autogenerated file by gen_backend_stubs.py. Do not edit directly!"
  282. )
  283. # Convert to a set first to remove duplicate kernel names.
  284. # Backends are allowed to repeat kernel names; only generate the declaration once!
  285. # Sort for deterministic output.
  286. backend_declarations = list(
  287. sorted(
  288. set(
  289. concatMap(
  290. lambda f: dest.compute_native_function_declaration(
  291. f, backend_indices[backend_dispatch_key]
  292. ),
  293. grouped_native_functions,
  294. )
  295. )
  296. )
  297. )
  298. autograd_declarations = list(
  299. sorted(
  300. set(
  301. concatMap(
  302. lambda f: []
  303. if autograd_dispatch_key is None
  304. else dest.compute_native_function_declaration(
  305. f, backend_indices[autograd_dispatch_key]
  306. ),
  307. grouped_native_functions,
  308. )
  309. )
  310. )
  311. )
  312. ns_helper = NamespaceHelper(cpp_namespace)
  313. fm.write_with_template(
  314. f"{backend_dispatch_key}NativeFunctions.h",
  315. "DispatchKeyNativeFunctions.h",
  316. lambda: {
  317. "generated_comment": generated_comment,
  318. "namespace_prologue": ns_helper.prologue,
  319. "class_name": class_name,
  320. "namespace_epilogue": ns_helper.epilogue,
  321. "dispatch_declarations": backend_declarations + autograd_declarations,
  322. "BackendName": backend_name,
  323. "DispatchKey": backend_dispatch_key,
  324. },
  325. )
  326. def gen_dispatcher_registrations(
  327. fm: FileManager,
  328. output_dir: str,
  329. class_name: str,
  330. cpp_namespace: str,
  331. backend_indices: Dict[DispatchKey, BackendIndex],
  332. grouped_native_functions: Sequence[Union[NativeFunction, NativeFunctionsGroup]],
  333. backend_dispatch_key: DispatchKey,
  334. dispatch_key: DispatchKey,
  335. selector: "SelectiveBuilder",
  336. # build_in_tree is true for lazy TS backend and affects include paths, not used for external backends
  337. build_in_tree: bool = False,
  338. per_operator_headers: bool = False,
  339. backend_name: str = "",
  340. eager_registration: bool = True,
  341. ) -> None:
  342. headers = [
  343. f"{output_dir}/{backend_dispatch_key}NativeFunctions.h",
  344. ]
  345. if build_in_tree:
  346. external_backend_headers_str = "\n".join(f"#include <{h}>" for h in headers)
  347. else:
  348. external_backend_headers_str = "\n".join(f'#include "{h}"' for h in headers)
  349. assert class_name is not None
  350. backend_index = backend_indices[dispatch_key]
  351. dispatch_registrations_body = list(
  352. concatMap(
  353. dest.RegisterDispatchKey(
  354. backend_index,
  355. Target.REGISTRATION,
  356. selector,
  357. rocm=False,
  358. cpp_namespace=cpp_namespace,
  359. class_method_name=f"{class_name}",
  360. skip_dispatcher_op_registration=False,
  361. ),
  362. grouped_native_functions,
  363. )
  364. )
  365. deferred_dispatch_registrations = ""
  366. static_init_dispatch_registrations = ""
  367. if eager_registration:
  368. static_template = CodeTemplate(
  369. """\
  370. TORCH_LIBRARY_IMPL(aten, $dispatch_key, m) {
  371. $dispatch_registrations_body
  372. };"""
  373. )
  374. static_init_dispatch_registrations = static_template.substitute(
  375. dispatch_key=dispatch_key,
  376. dispatch_registrations_body=dispatch_registrations_body,
  377. )
  378. else:
  379. deferred_template = CodeTemplate(
  380. """\
  381. TORCH_API void Register${backend_name}${dispatch_key}NativeFunctions() {
  382. static auto m = MAKE_TORCH_LIBRARY_IMPL(aten, $dispatch_key);
  383. $dispatch_registrations_body
  384. }"""
  385. )
  386. deferred_dispatch_registrations = deferred_template.substitute(
  387. backend_name=backend_name,
  388. dispatch_key=dispatch_key,
  389. dispatch_registrations_body=dispatch_registrations_body,
  390. )
  391. fm.write_with_template(
  392. f"Register{dispatch_key}.cpp",
  393. "RegisterDispatchKey.cpp",
  394. lambda: {
  395. "static_init_dispatch_registrations": static_init_dispatch_registrations,
  396. "deferred_dispatch_registrations": deferred_dispatch_registrations,
  397. "extra_cuda_headers": "",
  398. "external_backend_headers": external_backend_headers_str,
  399. "ops_headers": "#include <ATen/Functions.h>"
  400. if not per_operator_headers
  401. else "",
  402. "DispatchKey": dispatch_key,
  403. "dispatch_namespace": dispatch_key.lower(),
  404. "dispatch_headers": dest.gen_registration_headers(
  405. backend_index, per_operator_headers=per_operator_headers, rocm=False
  406. ),
  407. "dispatch_helpers": dest.gen_registration_helpers(backend_index),
  408. "dispatch_namespaced_definitions": "",
  409. "dispatch_anonymous_definitions": list(
  410. concatMap(
  411. dest.RegisterDispatchKey(
  412. backend_index,
  413. Target.ANONYMOUS_DEFINITION,
  414. selector,
  415. rocm=False,
  416. cpp_namespace=cpp_namespace,
  417. class_method_name=f"{class_name}",
  418. skip_dispatcher_op_registration=False,
  419. ),
  420. grouped_native_functions,
  421. )
  422. ),
  423. },
  424. )
  425. def run(
  426. source_yaml: str, output_dir: str, dry_run: bool, impl_path: Optional[str] = None
  427. ) -> None:
  428. # Assumes that this file lives at PYTORCH_ROOT/torchgen/gen_backend_stubs.py
  429. pytorch_root = pathlib.Path(__file__).parent.parent.absolute()
  430. template_dir = os.path.join(pytorch_root, "aten/src/ATen/templates")
  431. def make_file_manager(install_dir: str) -> FileManager:
  432. return FileManager(
  433. install_dir=install_dir, template_dir=template_dir, dry_run=dry_run
  434. )
  435. fm = make_file_manager(output_dir)
  436. native_yaml_path = os.path.join(
  437. pytorch_root, "aten/src/ATen/native/native_functions.yaml"
  438. )
  439. tags_yaml_path = os.path.join(pytorch_root, "aten/src/ATen/native/tags.yaml")
  440. parsed_yaml = parse_native_yaml(native_yaml_path, tags_yaml_path)
  441. native_functions, backend_indices = (
  442. parsed_yaml.native_functions,
  443. parsed_yaml.backend_indices,
  444. )
  445. grouped_native_functions = get_grouped_native_functions(native_functions)
  446. parsed_backend_yaml = parse_backend_yaml(
  447. source_yaml, grouped_native_functions, backend_indices
  448. )
  449. backend_key = parsed_backend_yaml.backend_key
  450. autograd_key = parsed_backend_yaml.autograd_key
  451. cpp_namespace = parsed_backend_yaml.cpp_namespace
  452. class_name = parsed_backend_yaml.class_name
  453. backend_indices = parsed_backend_yaml.backend_indices
  454. selector = SelectiveBuilder.get_nop_selector()
  455. if backend_key is None:
  456. # This could be useful if a backend wants to quickly set up a noop yaml file but doesn't have any kernels ready yet.
  457. return
  458. if class_name is None:
  459. # class_name is an optional argument to backend yaml file.
  460. # if specified it allows an external backend to override
  461. # the name of the class that all generated kernel definitions live under.
  462. # if not specified, its value is given as native_function_class_name.
  463. class_name = backend_indices[backend_key].native_function_class_name()
  464. assert class_name is not None
  465. if impl_path is not None:
  466. error_on_missing_kernels(
  467. native_functions,
  468. backend_indices,
  469. backend_key,
  470. autograd_key,
  471. class_name,
  472. impl_path,
  473. )
  474. gen_dispatchkey_nativefunc_headers(
  475. fm,
  476. class_name,
  477. cpp_namespace,
  478. backend_indices,
  479. grouped_native_functions,
  480. backend_key,
  481. autograd_key,
  482. )
  483. for dispatch_key in (
  484. [backend_key] if autograd_key is None else [backend_key, autograd_key]
  485. ):
  486. gen_dispatcher_registrations(
  487. fm,
  488. output_dir,
  489. class_name,
  490. cpp_namespace,
  491. backend_indices,
  492. grouped_native_functions,
  493. backend_key,
  494. dispatch_key,
  495. selector,
  496. )
# Script entry point: run the command-line interface only when this file is
# executed directly, not when it is imported as a module.
if __name__ == "__main__":
    main()