Update TensorImpl constructor to take the tensor dimensions instead of the number of elements.
Compare changes
@@ -69,12 +69,13 @@ private:
@@ -69,12 +69,13 @@ private:
/**
 * @brief Build a TensorImpl_cuda for the given device and length.
 *
 * Forwards Backend, device and length to the TensorImpl base constructor,
 * then initializes mDataOwner from a null pointer and cudaDelete.
 * The constructor body itself does nothing else.
 *
 * @param device Device index handed unchanged to TensorImpl.
 * @param length Value of type NbElts_t handed unchanged to TensorImpl
 *               (presumably the number of elements - confirm with TensorImpl).
 *
 * NOTE(review): mDataOwner looks like an owning pointer that uses cudaDelete
 * as its deleter and starts out empty - confirm against the member declaration.
 */
TensorImpl_cuda(DeviceIdx_t device, NbElts_t length)
    : TensorImpl(Backend, device, length),
      mDataOwner(nullptr, cudaDelete)
{
}