Updated the padding code to work with half floats

This commit is contained in:
Benoit Steiner 2016-02-23 05:51:22 +00:00
parent 8cb9bfab87
commit 1d9256f7db

View File

@ -151,27 +151,27 @@ struct TensorEvaluator<const TensorPaddingOp<PaddingDimensions, ArgType>, Device
for (int i = NumDims - 1; i > 0; --i) { for (int i = NumDims - 1; i > 0; --i) {
const Index idx = index / m_outputStrides[i]; const Index idx = index / m_outputStrides[i];
if (idx < m_padding[i].first || idx >= m_dimensions[i] - m_padding[i].second) { if (idx < m_padding[i].first || idx >= m_dimensions[i] - m_padding[i].second) {
return Scalar(0); return internal::scalar_cast_op<int, Scalar>()(0);
} }
inputIndex += (idx - m_padding[i].first) * m_inputStrides[i]; inputIndex += (idx - m_padding[i].first) * m_inputStrides[i];
index -= idx * m_outputStrides[i]; index -= idx * m_outputStrides[i];
} }
if (index < m_padding[0].first || index >= m_dimensions[0] - m_padding[0].second) { if (index < m_padding[0].first || index >= m_dimensions[0] - m_padding[0].second) {
return Scalar(0); return internal::scalar_cast_op<int, Scalar>()(0);
} }
inputIndex += (index - m_padding[0].first); inputIndex += (index - m_padding[0].first);
} else { } else {
for (int i = 0; i < NumDims - 1; ++i) { for (int i = 0; i < NumDims - 1; ++i) {
const Index idx = index / m_outputStrides[i+1]; const Index idx = index / m_outputStrides[i+1];
if (idx < m_padding[i].first || idx >= m_dimensions[i] - m_padding[i].second) { if (idx < m_padding[i].first || idx >= m_dimensions[i] - m_padding[i].second) {
return Scalar(0); return internal::scalar_cast_op<int, Scalar>()(0);
} }
inputIndex += (idx - m_padding[i].first) * m_inputStrides[i]; inputIndex += (idx - m_padding[i].first) * m_inputStrides[i];
index -= idx * m_outputStrides[i+1]; index -= idx * m_outputStrides[i+1];
} }
if (index < m_padding[NumDims-1].first || if (index < m_padding[NumDims-1].first ||
index >= m_dimensions[NumDims-1] - m_padding[NumDims-1].second) { index >= m_dimensions[NumDims-1] - m_padding[NumDims-1].second) {
return Scalar(0); return internal::scalar_cast_op<int, Scalar>()(0);
} }
inputIndex += (index - m_padding[NumDims-1].first); inputIndex += (index - m_padding[NumDims-1].first);
} }
@ -194,14 +194,14 @@ struct TensorEvaluator<const TensorPaddingOp<PaddingDimensions, ArgType>, Device
{ {
const Index idx = coords[0]; const Index idx = coords[0];
if (idx < m_padding[0].first || idx >= m_dimensions[0] - m_padding[0].second) { if (idx < m_padding[0].first || idx >= m_dimensions[0] - m_padding[0].second) {
return Scalar(0); return internal::scalar_cast_op<int, Scalar>()(0);
} }
inputIndex = idx - m_padding[0].first; inputIndex = idx - m_padding[0].first;
} }
for (int i = 1; i < NumDims; ++i) { for (int i = 1; i < NumDims; ++i) {
const Index idx = coords[i]; const Index idx = coords[i];
if (idx < m_padding[i].first || idx >= m_dimensions[i] - m_padding[i].second) { if (idx < m_padding[i].first || idx >= m_dimensions[i] - m_padding[i].second) {
return Scalar(0); return internal::scalar_cast_op<int, Scalar>()(0);
} }
inputIndex += (idx - m_padding[i].first) * m_inputStrides[i]; inputIndex += (idx - m_padding[i].first) * m_inputStrides[i];
} }
@ -209,14 +209,14 @@ struct TensorEvaluator<const TensorPaddingOp<PaddingDimensions, ArgType>, Device
{ {
const Index idx = coords[NumDims-1]; const Index idx = coords[NumDims-1];
if (idx < m_padding[NumDims-1].first || idx >= m_dimensions[NumDims-1] - m_padding[NumDims-1].second) { if (idx < m_padding[NumDims-1].first || idx >= m_dimensions[NumDims-1] - m_padding[NumDims-1].second) {
return Scalar(0); return internal::scalar_cast_op<int, Scalar>()(0);
} }
inputIndex = idx - m_padding[NumDims-1].first; inputIndex = idx - m_padding[NumDims-1].first;
} }
for (int i = NumDims - 2; i >= 0; --i) { for (int i = NumDims - 2; i >= 0; --i) {
const Index idx = coords[i]; const Index idx = coords[i];
if (idx < m_padding[i].first || idx >= m_dimensions[i] - m_padding[i].second) { if (idx < m_padding[i].first || idx >= m_dimensions[i] - m_padding[i].second) {
return Scalar(0); return internal::scalar_cast_op<int, Scalar>()(0);
} }
inputIndex += (idx - m_padding[i].first) * m_inputStrides[i]; inputIndex += (idx - m_padding[i].first) * m_inputStrides[i];
} }
@ -245,11 +245,11 @@ struct TensorEvaluator<const TensorPaddingOp<PaddingDimensions, ArgType>, Device
if (last < lastPaddedLeft) { if (last < lastPaddedLeft) {
// all the coefficient are in the padding zone. // all the coefficient are in the padding zone.
return internal::pset1<PacketReturnType>(Scalar(0)); return internal::pset1<PacketReturnType>(internal::scalar_cast_op<int, Scalar>()(0));
} }
else if (first >= firstPaddedRight && last < lastPaddedRight) { else if (first >= firstPaddedRight && last < lastPaddedRight) {
// all the coefficient are in the padding zone. // all the coefficient are in the padding zone.
return internal::pset1<PacketReturnType>(Scalar(0)); return internal::pset1<PacketReturnType>(internal::scalar_cast_op<int, Scalar>()(0));
} }
else if (first >= lastPaddedLeft && last < firstPaddedRight) { else if (first >= lastPaddedLeft && last < firstPaddedRight) {
// all the coefficient are between the 2 padding zones. // all the coefficient are between the 2 padding zones.
@ -271,11 +271,11 @@ struct TensorEvaluator<const TensorPaddingOp<PaddingDimensions, ArgType>, Device
if (last < lastPaddedLeft) { if (last < lastPaddedLeft) {
// all the coefficient are in the padding zone. // all the coefficient are in the padding zone.
return internal::pset1<PacketReturnType>(Scalar(0)); return internal::pset1<PacketReturnType>(internal::scalar_cast_op<int, Scalar>()(0));
} }
else if (first >= firstPaddedRight && last < lastPaddedRight) { else if (first >= firstPaddedRight && last < lastPaddedRight) {
// all the coefficient are in the padding zone. // all the coefficient are in the padding zone.
return internal::pset1<PacketReturnType>(Scalar(0)); return internal::pset1<PacketReturnType>(internal::scalar_cast_op<int, Scalar>()(0));
} }
else if (first >= lastPaddedLeft && last < firstPaddedRight) { else if (first >= lastPaddedLeft && last < firstPaddedRight) {
// all the coefficient are between the 2 padding zones. // all the coefficient are between the 2 padding zones.
@ -304,11 +304,11 @@ struct TensorEvaluator<const TensorPaddingOp<PaddingDimensions, ArgType>, Device
if (last < lastPaddedLeft) { if (last < lastPaddedLeft) {
// all the coefficient are in the padding zone. // all the coefficient are in the padding zone.
return internal::pset1<PacketReturnType>(Scalar(0)); return internal::pset1<PacketReturnType>(internal::scalar_cast_op<int, Scalar>()(0));
} }
else if (first >= firstPaddedRight && last < lastPaddedRight) { else if (first >= firstPaddedRight && last < lastPaddedRight) {
// all the coefficient are in the padding zone. // all the coefficient are in the padding zone.
return internal::pset1<PacketReturnType>(Scalar(0)); return internal::pset1<PacketReturnType>(internal::scalar_cast_op<int, Scalar>()(0));
} }
else if (first >= lastPaddedLeft && last < firstPaddedRight) { else if (first >= lastPaddedLeft && last < firstPaddedRight) {
// all the coefficient are between the 2 padding zones. // all the coefficient are between the 2 padding zones.
@ -330,11 +330,11 @@ struct TensorEvaluator<const TensorPaddingOp<PaddingDimensions, ArgType>, Device
if (last < lastPaddedLeft) { if (last < lastPaddedLeft) {
// all the coefficient are in the padding zone. // all the coefficient are in the padding zone.
return internal::pset1<PacketReturnType>(Scalar(0)); return internal::pset1<PacketReturnType>(internal::scalar_cast_op<int, Scalar>()(0));
} }
else if (first >= firstPaddedRight && last < lastPaddedRight) { else if (first >= firstPaddedRight && last < lastPaddedRight) {
// all the coefficient are in the padding zone. // all the coefficient are in the padding zone.
return internal::pset1<PacketReturnType>(Scalar(0)); return internal::pset1<PacketReturnType>(internal::scalar_cast_op<int, Scalar>()(0));
} }
else if (first >= lastPaddedLeft && last < firstPaddedRight) { else if (first >= lastPaddedLeft && last < firstPaddedRight) {
// all the coefficient are between the 2 padding zones. // all the coefficient are between the 2 padding zones.