[executorch] Add RuntimeContext to generated C++ API Signature (#94570)
Summary:
Pass runtime context all the way to kernel level.
RegisterCodegenUnboxedKernels.cpp:
```
static Operator operators_to_register[] = {
Operator(
"aten::add.out",
[](torch::executor::RuntimeContext & context, EValue** stack) {
EValue& self = *stack[0];
EValue& other = *stack[1];
EValue& alpha = *stack[2];
EValue& out = *stack[3];
const torch::executor::Tensor & self_base = self.to<torch::executor::Tensor>();
const torch::executor::Tensor & other_base = other.to<torch::executor::Tensor>();
const torch::executor::Scalar & alpha_base = alpha.to<torch::executor::Scalar>();
torch::executor::Tensor & out_base = out.to<torch::executor::Tensor>();
EXECUTORCH_SCOPE_PROF("native_call_add.out");
torch::executor::aten::add_outf(context, self_base, other_base, alpha_base, out_base);
}
),
}
```
Functions.h
```
// aten::add.out(Tensor self, Tensor other, *, Scalar alpha=1, Tensor(a!) out) -> Tensor(a!)
TORCH_API inline at::Tensor & add_outf(torch::executor::RuntimeContext & context, const at::Tensor & self, const at::Tensor & other, const at::Scalar & alpha, at::Tensor & out) {
return torch::executor::native::add_out(self, other, alpha, out);
}
```
Test Plan: TBD
Differential Revision: D41325633
Pull Request resolved: https://github.com/pytorch/pytorch/pull/94570
Approved by: https://github.com/cccclai