kulinseth · Ronian526 · Jan 18, 2023 · Jan 12, 2023 · Jan 12, 2023 · Jan 14, 2023
@@ -96,10 +96,12 @@ static inline MTLLanguageVersion getMetalLanguageVersion(const id<MTLDevice>& de
  static bool _macos_13_0_plus = [mpsCD instancesRespondToSelector:@selector(cumulativeSumWithTensor:axis:name:)] == YES;
  static bool _macos_13_1_plus = [mpsCD instancesRespondToSelector:@selector(
  sampleGridWithSourceTensor:coordinateTensor:layout:normalizeCoordinates:relativeCoordinates:alignCorners:paddingMode:samplingMode:constantValue:name:)] == YES;
+ static bool _macos_13_2_plus = [mpsCD instancesRespondToSelector:@selector(convolution3DWithSourceTensor:weightsTensor:descriptor:name:)] == YES;
 
  switch (subVersion) {
  case 0: return _macos_13_0_plus;
  case 1: return _macos_13_1_plus;
+ case 2: return _macos_13_2_plus;
  default: return false;
  }
 }

@@ -27,6 +27,10 @@
 void binaryOpTensor(const Tensor& self, const Tensor& other, const Scalar& alpha,
  const Tensor& output_, std::string op_name, BinaryOpBlock binaryBlock)
 {
+ TORCH_CHECK(!(op_name == "power" && !is_macos_13_or_newer(2) &&
+ (self.scalar_type() == ScalarType::Long ||
+ (other.scalar_type() == ScalarType::Long && (self.scalar_type() != ScalarType::Half && self.scalar_type() != ScalarType::Float)))),
+ "MPS: ", op_name, " op with int64 input is supported natively starting from macOS 13.2");
  MPSStream* mpsStream = getCurrentMPSStream();
 
  const bool is_self_scalar = self.dim() == 0;
@@ -246,7 +250,7 @@ void add_sub_template(const Tensor& self, const Tensor& other, const Scalar& alp
 #define CREATE_MPS_STRUCTURED_BINARY_OP_FUNC(func_out, func_stub, other_type) \
 TORCH_IMPL_FUNC(func_out) (const Tensor& self, const other_type& other, const Tensor& output) { \
  TORCH_CHECK(!(self.scalar_type() == ScalarType::Long && \
- (std::string(#func_stub) == "power" || std::string(#func_stub) == "atan2")), \
+ std::string(#func_stub) == "atan2"),  \
  "MPS does not support ", #func_stub, " op with int64 input") \
  mps::binaryOp##other_type(self, other, Scalar(1.0), output, #func_stub, \
  ^BinaryOpFn(cachedGraph, primaryCastTensor, secondaryCastTensor) { \

@@ -9034,7 +9034,7 @@ class TestConsistency(TestCase):
  'i64',
  'u8'],
  'sqrt': ['b8', 'f32', 'i16', 'i32', 'i64', 'u8'],
- 'square': ['f16', 'f32'],
+ 'square': ['b8', 'f16', 'f32', 'i16', 'i32', 'i64', 'u8'],
  'squeeze': ['b8', 'f16', 'f32', 'i16', 'i32', 'i64', 'u8'],
  'stack': ['b8', 'f16', 'f32', 'i16', 'i32', 'i64', 'u8'],
  'std': ['f16', 'f32'],
@@ -9280,7 +9280,6 @@ class TestConsistency(TestCase):
  'nn.functional.interpolatearea': [torch.float32],
  'resize_as_': [torch.float16, torch.float32],
  'topk': [torch.int16, torch.int32, torch.int64, torch.uint8],
- 'square': [torch.bool, torch.int16, torch.int32, torch.int64, torch.uint8],
 
  # Functions with correctness issues
  'unique': [torch.bool, torch.float16, torch.float32, torch.int16, torch.int32, torch.int64, torch.uint8],