forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathFusedAdagrad.cpp
59 lines (54 loc) · 1.46 KB
/
FusedAdagrad.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
#define TORCH_ASSERT_ONLY_METHOD_OPERATORS
#include <ATen/core/Tensor.h>
#include <ATen/native/DispatchStub.h>
#include <ATen/native/FusedAdagrad.h>
#ifndef AT_PER_OPERATOR_HEADERS
#include <ATen/Functions.h>
#include <ATen/NativeFunctions.h>
#else
#include <ATen/ops/_fused_adagrad.h>
#include <ATen/ops/_fused_adagrad_native.h>
#endif
namespace at {
namespace native {
void _fused_adagrad_kernel_cpu_(
at::TensorList params,
at::TensorList grads,
at::TensorList state_sums,
at::TensorList state_steps,
const double lr,
const double lr_decay,
const double weight_decay,
const double eps,
const bool maximize,
const std::optional<at::Tensor>& grad_scale,
const std::optional<at::Tensor>& found_inf) {
const float* grad_scale_ptr =
grad_scale.has_value() ? grad_scale->data_ptr<float>() : nullptr;
const float* found_inf_ptr =
found_inf.has_value() ? found_inf->data_ptr<float>() : nullptr;
if (found_inf_ptr && *found_inf_ptr == 1.0) {
return;
}
size_t n_tensors = params.size();
TORCH_CHECK(grads.size() == n_tensors);
TORCH_CHECK(state_sums.size() == n_tensors);
TORCH_CHECK(state_steps.size() == n_tensors);
for (size_t i = 0; i < n_tensors; i++){
fused_adagrad_stub(
kCPU,
params[i],
grads[i],
state_sums[i],
state_steps[i],
lr,
lr_decay,
weight_decay,
eps,
maximize,
grad_scale_ptr);
}
}
DEFINE_DISPATCH(fused_adagrad_stub);
}
}