/* generic/cpu.c -- CPU kernels for spline basis evaluation and spline weighting (TH generic file). */
#ifndef TH_GENERIC_FILE
#define TH_GENERIC_FILE "generic/cpu.c"
#else

/*
 * Forward pass of the degree-1 (linear) spline basis.
 *
 * All iteration is delegated to the SPLINE_BASIS macro, which is defined
 * outside this file; this function only supplies the degree (1) and the
 * statement that converts `value` into the basis weight for the current
 * `k_mod`.
 *
 * NOTE(review): `value` and `k_mod` are introduced by SPLINE_BASIS.
 * Presumably `value` is the fractional position inside the current knot
 * interval and `k_mod` is 0 or 1 -- confirm against the macro definition.
 * The arguments basis, weight_index, pseudo, kernel_size, is_open_spline and
 * K are forwarded to the macro unchanged.
 */
void spline_(linear_basis_forward)(THTensor *basis, THLongTensor *weight_index, THTensor *pseudo, THLongTensor *kernel_size, THByteTensor *is_open_spline, int K) {
  SPLINE_BASIS(1, basis, weight_index, pseudo, kernel_size, is_open_spline, K,
    /* For k_mod == 0 this evaluates to 1 - value; for k_mod == 1 to value. */
    value = (1 - k_mod) * (1 - value) + k_mod * value;
  )
}
/*
 * Forward pass of the degree-2 (quadratic) spline basis.
 *
 * Iteration is delegated to the SPLINE_BASIS macro (defined outside this
 * file). The statements passed as the last macro argument replace `value`
 * by one of three quadratic polynomials in `value`, chosen by `k_mod`:
 *
 *   k_mod == 0 :  0.5 * (1 - value)^2
 *   k_mod == 1 :  -value^2 + value + 0.5
 *   otherwise  :  0.5 * value^2
 *
 * NOTE(review): `value` and `k_mod` come from SPLINE_BASIS; presumably
 * k_mod is in {0, 1, 2} for degree 2 -- confirm against the macro.
 */
void spline_(quadratic_basis_forward)(THTensor *basis, THLongTensor *weight_index, THTensor *pseudo, THLongTensor *kernel_size, THByteTensor *is_open_spline, int K) {
  SPLINE_BASIS(2, basis, weight_index, pseudo, kernel_size, is_open_spline, K,
    if (k_mod == 0) {
      value = 0.5 * (1 - value) * (1 - value);
    } else if (k_mod == 1) {
      value = -value * value + value + 0.5;
    } else {
      value = 0.5 * value * value;
    }
  )
}
/*
 * Forward pass of the degree-3 (cubic) spline basis.
 *
 * Iteration is delegated to the SPLINE_BASIS macro (defined outside this
 * file). The statements passed as the last macro argument replace `value`
 * by one of four cubic polynomials in `value`, chosen by `k_mod`:
 *
 *   k_mod == 0 :  (1 - value)^3 / 6
 *   k_mod == 1 :  (3 value^3 - 6 value^2 + 4) / 6
 *   k_mod == 2 :  (-3 value^3 + 3 value^2 + 3 value + 1) / 6
 *   otherwise  :  value^3 / 6
 *
 * NOTE(review): `value` and `k_mod` come from SPLINE_BASIS; presumably
 * k_mod is in {0, 1, 2, 3} for degree 3 -- confirm against the macro.
 */
void spline_(cubic_basis_forward)(THTensor *basis, THLongTensor *weight_index, THTensor *pseudo, THLongTensor *kernel_size, THByteTensor *is_open_spline, int K) {
  SPLINE_BASIS(3, basis, weight_index, pseudo, kernel_size, is_open_spline, K,
    if (k_mod == 0) {
      value = (1 - value) * (1 - value) * (1 - value) / 6.0;
    } else if (k_mod == 1) {
      value = (3 * value * value * value - 6 * value * value + 4) / 6.0;
    } else if (k_mod == 2) {
      value = (-3 * value * value * value + 3 * value * value + 3 * value + 1) / 6.0;
    } else {
      value = value * value * value / 6.0;
    }
  )
}

/*
 * Spline weighting, forward pass.
 *
 * For every slice along dimension 1 that TH_TENSOR_DIM_APPLY4 hands to the
 * loop body, computes
 *
 *   output[m_out] = sum over s, m_in of
 *                   basis[s] * weight[weight_index[s]][m_in][m_out] * input[m_in]
 *
 * `weight` is read through its raw storage pointer and indexed as a flat
 * [kernel][M_in][M_out] array, so it is treated as contiguous in that order.
 * output, input, basis and weight_index are accessed through the
 * `<name>_data` / `<name>_stride` variables provided by the macro.
 */
void spline_(weighting_forward)(THTensor *output, THTensor *input, THTensor *weight, THTensor *basis, THLongTensor *weight_index) {
  real *weight_data = weight->storage->data + weight->storageOffset;
  int64_t M_out = THTensor_(size)(output, 1);
  int64_t M_in = THTensor_(size)(input, 1);
  int64_t S = THLongTensor_size(weight_index, 1);
  int64_t m_out;
  int64_t m_in;
  int64_t s;
  int64_t w_idx;
  real coeff;
  real acc;

  TH_TENSOR_DIM_APPLY4(real, output, real, input, real, basis, int64_t, weight_index, 1,
    for (m_out = 0; m_out < M_out; m_out++) {
      acc = 0;
      for (s = 0; s < S; s++) {
        /* Basis coefficient and the kernel slot it applies to. */
        coeff = basis_data[s * basis_stride];
        w_idx = weight_index_data[s * weight_index_stride];
        for (m_in = 0; m_in < M_in; m_in++) {
          acc += coeff * weight_data[w_idx * M_in * M_out + m_in * M_out + m_out] * input_data[m_in * input_stride];
        }
      }
      *(output_data + m_out * output_stride) = acc;
    }
  )
}

/*
 * Spline weighting, backward pass with respect to the input features.
 *
 * For every slice handed to the loop body by SPLINE_WEIGHTING_BACKWARD
 * (defined outside this file), computes
 *
 *   grad_input[m_in] = sum over s, m_out of
 *                      basis[s] * grad_output[m_out]
 *                               * weight[weight_index[s]][m_in][m_out]
 *
 * `weight` is read through its raw storage pointer and indexed as a flat
 * [kernel][M_in][M_out] array, so it is treated as contiguous in that order.
 *
 * The loop variables m_in, m_out, s, w_idx, value and the bounds M_in,
 * M_out, S are not declared here; they are expected to come from the macro.
 *
 * NOTE(review): this call passes the sizes as (grad_input, grad_output), i.e.
 * (in, out), whereas weighting_backward_weight and weighting_backward_basis
 * pass (grad_output, input), i.e. (out, in). The macro is not visible from
 * here, so which order it expects could not be confirmed.
 */
void spline_(weighting_backward_input)(THTensor *grad_input, THTensor *grad_output, THTensor *weight, THTensor *basis, THLongTensor *weight_index) {
  real *weight_data = weight->storage->data + weight->storageOffset;
  real b;

  SPLINE_WEIGHTING_BACKWARD(grad_input, grad_output, basis, weight_index, THTensor_(size)(grad_input, 1), THTensor_(size)(grad_output, 1), THLongTensor_size(weight_index, 1),
    for (m_in = 0; m_in < M_in; m_in++) {
      value = 0;
      for (s = 0; s < S; s++) {
        b = *(basis_data + s * basis_stride);
        w_idx = *(weight_index_data + s * weight_index_stride);
        for (m_out = 0; m_out < M_out; m_out++) {
          value += b * *(grad_output_data + m_out * grad_output_stride) * *(weight_data + w_idx * M_in * M_out + m_in * M_out + m_out);
        }
      }
      /* Honour the stride of grad_input, as every other tensor access here
         does; a bare [m_in] is only correct for a unit stride. Assumes the
         macro defines grad_input_stride like the other <name>_stride
         variables. */
      grad_input_data[m_in * grad_input_stride] = value;
    }
  )
}

/*
 * Spline weighting, backward pass with respect to the kernel weights.
 *
 * For every slice handed to the loop body by SPLINE_WEIGHTING_BACKWARD
 * (defined outside this file), accumulates
 *
 *   grad_weight[weight_index[s]][m_in][m_out] +=
 *       basis[s] * grad_output[m_out] * input[m_in]
 *
 * `grad_weight` is written through its raw storage pointer and indexed as a
 * flat [kernel][M_in][M_out] array. Contributions are added with `+=`, so the
 * caller is presumably expected to pass a zero-initialised grad_weight.
 *
 * The loop variables m_in, m_out, s, w_idx, value and the bounds M_in,
 * M_out, S are not declared here; they are expected to come from the macro.
 *
 * NOTE(review): this call passes the sizes as (grad_output, input), i.e.
 * (out, in), whereas weighting_backward_input passes (grad_input,
 * grad_output), i.e. (in, out). The macro is not visible from here, so which
 * order it expects could not be confirmed.
 */
void spline_(weighting_backward_weight)(THTensor *grad_weight, THTensor *grad_output, THTensor *input, THTensor *basis, THLongTensor *weight_index) {
  real *grad_weight_data = grad_weight->storage->data + grad_weight->storageOffset;
  real b;

  SPLINE_WEIGHTING_BACKWARD(grad_output, input, basis, weight_index, THTensor_(size)(grad_output, 1), THTensor_(size)(input, 1), THLongTensor_size(weight_index, 1),
    for (m_out = 0; m_out < M_out; m_out++) {
      /* Upstream gradient for this output channel. */
      value = grad_output_data[m_out * grad_output_stride];
      for (s = 0; s < S; s++) {
        b = basis_data[s * basis_stride];
        w_idx = weight_index_data[s * weight_index_stride];
        for (m_in = 0; m_in < M_in; m_in++) {
          *(grad_weight_data + w_idx * M_in * M_out + m_in * M_out + m_out) += b * value * input_data[m_in * input_stride];
        }
      }
    }
  )
}

/*
 * Spline weighting, backward pass with respect to the basis coefficients.
 *
 * For every slice handed to the loop body by SPLINE_WEIGHTING_BACKWARD
 * (defined outside this file), accumulates
 *
 *   grad_basis[s] += grad_output[m_out] *
 *                    sum over m_in of
 *                    input[m_in] * weight[weight_index[s]][m_in][m_out]
 *
 * for every m_out. `weight` is read through its raw storage pointer and
 * indexed as a flat [kernel][M_in][M_out] array. Contributions are added
 * with `+=`, so the caller is presumably expected to pass a zero-initialised
 * grad_basis.
 *
 * The loop variables m_in, m_out, s, w_idx, value and the bounds M_in,
 * M_out, S are not declared here; they are expected to come from the macro.
 *
 * NOTE(review): this call passes the sizes as (grad_output, input), i.e.
 * (out, in), whereas weighting_backward_input passes (grad_input,
 * grad_output), i.e. (in, out). The macro is not visible from here, so which
 * order it expects could not be confirmed.
 */
void spline_(weighting_backward_basis)(THTensor *grad_basis, THTensor *grad_output, THTensor *input, THTensor *weight, THLongTensor *weight_index) {
  real *weight_data = weight->storage->data + weight->storageOffset;

  SPLINE_WEIGHTING_BACKWARD(grad_basis, grad_output, input, weight_index, THTensor_(size)(grad_output, 1), THTensor_(size)(input, 1), THLongTensor_size(weight_index, 1),
    for (m_out = 0; m_out < M_out; m_out++) {
      for (s = 0; s < S; s++) {
        w_idx = *(weight_index_data + s * weight_index_stride);
        value = 0;
        for (m_in = 0; m_in < M_in; m_in++) {
          value += *(input_data + m_in * input_stride) * *(weight_data + w_idx * M_in * M_out + m_in * M_out + m_out);
        }
        /* Honour the stride of grad_basis, as every other tensor access here
           does; a bare [s] is only correct for a unit stride. Assumes the
           macro defines grad_basis_stride like the other <name>_stride
           variables. */
        grad_basis_data[s * grad_basis_stride] += value * *(grad_output_data + m_out * grad_output_stride);
      }
    }
  )
}

#endif