1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37
|
#if !defined(C10_MOBILE) && !defined(ANDROID)
#pragma once
#include <ATen/Tensor.h>
#include <torch/csrc/inductor/aoti_runner/model_container_runner.h>
namespace torch::inductor {
class TORCH_API AOTIModelPackageLoader {
public:
AOTIModelPackageLoader(const std::string& model_package_path);
AOTIModelPackageLoader(
const std::string& model_package_path,
const std::string& model_name);
~AOTIModelPackageLoader();
AOTIModelContainerRunner* get_runner();
std::unordered_map<std::string, std::string> get_metadata();
std::vector<at::Tensor> run(
const std::vector<at::Tensor>& inputs,
void* stream_handle = nullptr);
std::vector<std::string> get_call_spec();
void load_constants(
std::unordered_map<std::string, at::Tensor>& constants_map,
bool use_inactive,
bool check_full_update);
std::vector<std::string> get_constant_fqns();
private:
std::string temp_dir_;
std::unique_ptr<AOTIModelContainerRunner> runner_;
std::unordered_map<std::string, std::string> metadata_;
void load_metadata(const std::string& cpp_filename);
};
} // namespace torch::inductor
#endif
|