import logging
import typing

from torch._inductor.utils import IndentedBuffer


__all__: list[str] = []
logger = logging.getLogger(__name__)


def _get_main_cpp_file(
    package_name: str,
    model_names: list[str],
    cuda: bool,
    example_inputs_map: typing.Optional[dict[str, int]],
) -> str:
    """
    Generates a main.cpp file for AOTInductor standalone models in the specified package.

    Args:
        package_name (str): Name of the package containing the models.
        model_names (list[str]): List of model names to include in the generated main.cpp.
        cuda (bool): Whether to generate code with CUDA support.
        example_inputs_map (Optional[dict[str, int]]): A mapping from model name to
            its number of example inputs. If provided, the generated main.cpp will
            load the serialized inputs from disk and run each model on them.

    Returns:
        str: The contents of the generated main.cpp file as a string.
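
    Example (illustrative; the package and model names are placeholders)::

        cpp_src = _get_main_cpp_file(
            package_name="my_package",
            model_names=["model"],
            cuda=False,
            example_inputs_map={"model": 2},  # "model" takes two example inputs
        )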
    """

    ib = IndentedBuffer()

    ib.writelines(
        [
            "#include <dlfcn.h>",
            "#include <fstream>",
            "#include <iostream>",
            "#include <memory>",
            "#include <torch/torch.h>",
            "#include <vector>",
            "#include <torch/csrc/inductor/aoti_torch/tensor_converter.h>",
        ]
    )
    if cuda:
        ib.writelines(
            [
                "#include <cuda.h>",
                "#include <cuda_runtime_api.h>",
            ]
        )

    for model_name in model_names:
        ib.writeline(
            f'#include "{package_name}/data/aotinductor/{model_name}/{model_name}.h"'
        )

    ib.newline()
    for model_name in model_names:
        ib.writeline(f"using torch::aot_inductor::AOTInductorModel{model_name};")

    ib.writelines(
        [
            "using torch::aot_inductor::ConstantHandle;",
            "using torch::aot_inductor::ConstantMap;",
            "",
            "int main(int argc, char* argv[]) {",
        ]
    )

    with ib.indent():
        ib.writeline(f'std::string device_str = "{"cuda" if cuda else "cpu"}";')
        ib.writeline("try {")

        with ib.indent():
            ib.writeline("c10::Device device(device_str);")

            if example_inputs_map is not None:
                # TODO: add device
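                # Each example input is expected on disk as
                # "<model_name>_input_<j>.pt", read as raw bytes and deserialized
                # with torch::pickle_load (e.g. a tensor written via torch.save).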
                for i, model_name in enumerate(model_names):
                    num_inputs = example_inputs_map[model_name]

                    ib.writeline(f"// Load input tensors for model {model_name}")
                    ib.writeline(f"std::vector<at::Tensor> input_tensors{i + 1};")
                    ib.writeline(f"for (int j = 0; j < {num_inputs}; ++j) {{")
                    with ib.indent():
                        ib.writeline(
                            f'std::string filename = "{model_name}_input_" + std::to_string(j) + ".pt";'
                        )
                        ib.writeline("std::ifstream in(filename, std::ios::binary);")
                        ib.writeline("if (!in.is_open()) {")
                        with ib.indent():
                            ib.writeline(
                                'std::cerr << "Failed to open file: " << filename << std::endl;'
                            )
                            ib.writeline("return 1;")
                        ib.writeline("}")
                        ib.writeline(
                            "std::vector<char> buffer((std::istreambuf_iterator<char>(in)), std::istreambuf_iterator<char>());"
                        )
                        ib.writeline(
                            "torch::IValue ivalue = torch::pickle_load(buffer);"
                        )
                        ib.writeline(
                            f"input_tensors{i + 1}.push_back(ivalue.toTensor().to(device));"
                        )
                    ib.writeline("}")
                    ib.newline()

                ib.writeline("\n// Create array of input handles")
                for i in range(len(model_names)):
                    ib.writelines(
                        [
                            f"auto input_handles{i + 1} =",
                            f"    torch::aot_inductor::unsafe_alloc_new_handles_from_tensors(input_tensors{i + 1});",
                        ]
                    )

                ib.writeline("\n// Create array for output handles")
                for i in range(len(model_names)):
                    ib.writeline(f"AtenTensorHandle output_handle{i + 1};")

            ib.writeline("\n// Create and load models")
            for i, model_name in enumerate(model_names):
                ib.writelines(
                    [
                        f"auto constants_map{i + 1} = std::make_shared<ConstantMap>();",
                        f"auto constants_array{i + 1} = std::make_shared<std::vector<ConstantHandle>>();",
                        f"auto model{i + 1} = std::make_unique<AOTInductorModel{model_name}>(",
                        f"    std::move(constants_map{i + 1}),",
                        f"    std::move(constants_array{i + 1}),",
                        "    device_str,",
                        f'    "{package_name}/data/aotinductor/{model_name}/");',
                        f"model{i + 1}->load_constants();",
                    ]
                )

            if example_inputs_map is not None:
                ib.writeline("\n// Run the models")
                for i in range(len(model_names)):
                    ib.writeline(
                        f"torch::aot_inductor::DeviceStreamType stream{i + 1} = nullptr;"
                    )
                    ib.writeline(
                        f"model{i + 1}->run(&input_handles{i + 1}[0], &output_handle{i + 1}, stream{i + 1}, nullptr);"
                    )

                ib.writeline("\n// Convert output handles to tensors")
                for i in range(len(model_names)):
                    ib.writelines(
                        [
                            f"auto output_tensor{i + 1} =",
                            f"    torch::aot_inductor::alloc_tensors_by_stealing_from_handles(&output_handle{i + 1}, 1);",
                        ]
                    )

                ib.writeline("\n// Validate outputs")
                for i in range(len(model_names)):
                    ib.writeline(
                        f"""std::cout << "output_tensor{i + 1}\\n" << output_tensor{i + 1} << std::endl;"""
                    )
                    ib.writeline(
                        f"""torch::save(output_tensor{i + 1}, "output_tensor{i + 1}.pt");"""
                    )

            ib.writeline("return 0;")

        ib.writelines(
            [
                "} catch (const std::exception &e) {",
            ]
        )
        with ib.indent():
            ib.writeline('std::cerr << "Error: " << e.what() << std::endl;')
            ib.writeline("return 1;")

        ib.writeline("}")
    ib.writeline("}")

    return ib.getvalue()


def _get_make_file(package_name: str, model_names: list[str], cuda: bool) -> str:
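    """
    Generates a CMakeLists.txt for building the standalone main.cpp against the
    AOTInductor-compiled models in the specified package.

    Args:
        package_name (str): Name of the package containing the models.
        model_names (list[str]): Models whose package subdirectories are added
            to the build and linked into the executable.
        cuda (bool): Whether to enable CUDA support in the build.

    Returns:
        str: The contents of the generated CMakeLists.txt file as a string.
    """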
    ib = IndentedBuffer()

    ib.writelines(
        [
            "cmake_minimum_required(VERSION 3.10)",
            "project(TestProject)",
            "",
            "set(CMAKE_CXX_STANDARD 17)",
            "",
        ]
    )

    from torch._inductor.config import test_configs

    if test_configs.use_libtorch:
        ib.writeline("find_package(Torch REQUIRED)")

    if cuda:
        ib.writeline("find_package(CUDA REQUIRED)")

    ib.newline()
    for model_name in model_names:
        ib.writeline(f"add_subdirectory({package_name}/data/aotinductor/{model_name}/)")

    ib.writeline("\nadd_executable(main main.cpp)")
    if cuda:
        ib.writeline("target_compile_definitions(main PRIVATE USE_CUDA)")

    model_libs = " ".join(model_names)
    ib.writeline(f"target_link_libraries(main PRIVATE torch {model_libs})")

    if cuda:
        ib.writeline("target_link_libraries(main PRIVATE cuda ${CUDA_LIBRARIES})")

    return ib.getvalue()
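

# Minimal usage sketch (illustrative; the package name, model names, and output
# directory are assumptions, not part of this module's API):
#
#     from pathlib import Path
#
#     out_dir = Path("standalone_build")
#     out_dir.mkdir(exist_ok=True)
#     (out_dir / "main.cpp").write_text(
#         _get_main_cpp_file("my_package", ["model"], False, {"model": 2})
#     )
#     (out_dir / "CMakeLists.txt").write_text(
#         _get_make_file("my_package", ["model"], False)
#     )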
