New pyannote-v3-pro (#1)
- New pyannote-v3-pro (8c02f5e91862b3bf8a4e23ca79c301196423d673)
- New pyannote-v3-pro SpeakerSegmenter (5ea9592772d00d547da99ae3f7e5c958c78deb9f)
- Update speaker_embedder/pyannote-v3-pro/LICENSE_NOTICE.txt (c5a4c6722d64a288af1864a70f91a2930cf1aa08)
- Update speaker_embedder/pyannote-v3-pro/W16A16/LICENSE_NOTICE.txt (374499d2f345de69a51a7c2567e0e462514ff7b8)
- Update speaker_embedder/pyannote-v3-pro/W8A16/LICENSE_NOTICE.txt (f1960989a5088756b8cbfdde1fa9c75bd7c1adcd)
- Update speaker_segmenter/pyannote-v3-pro/LICENSE_NOTICE.txt (f6b4119078515307b830d24254f50a766df950fd)
- Update speaker_segmenter/pyannote-v3-pro/W32A32/LICENSE_NOTICE.txt (b6731a299fd0f81f5617aaf6f246d62722ddafa2)
- Update speaker_segmenter/pyannote-v3-pro/W8A16/LICENSE_NOTICE.txt (d82d6c440f605ad1dcb58d7925aac3a233118131)
- Delete speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbeddingPreprocessor.mlmodelc (c79f308c1ca50c9e24487d0c18f43820c06d2b1b)
- Delete speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbeddingPreprocessor.mlmodelc (9b92fca14e181a18c573d15e92f3c15ee45ddb3a)
- pyannote-v3-pro W16A16 SpeakerEmbedderPreprocessor (acdfedd1ec4e0a8802af60c32a3e41dd115e0494)
- pyannote-v3-pro W8A16 SpeakerEmbedderPreprocessor (29c808ac698e3a6c48f752a05162321f1883f57e)
- speaker_embedder/pyannote-v3-pro/LICENSE_NOTICE.txt +7 -0
- speaker_embedder/pyannote-v3-pro/README.txt +6 -0
- speaker_embedder/pyannote-v3-pro/W16A16/LICENSE_NOTICE.txt +7 -0
- speaker_embedder/pyannote-v3-pro/W16A16/README.txt +6 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedder.mlmodelc/analytics/coremldata.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedder.mlmodelc/coremldata.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedder.mlmodelc/metadata.json +86 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedder.mlmodelc/model.mil +0 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedder.mlmodelc/weights/weight.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedderPreprocessor.mlmodelc/analytics/coremldata.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedderPreprocessor.mlmodelc/coremldata.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedderPreprocessor.mlmodelc/metadata.json +77 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedderPreprocessor.mlmodelc/model.mil +90 -0
- speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedderPreprocessor.mlmodelc/weights/weight.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W8A16/LICENSE_NOTICE.txt +7 -0
- speaker_embedder/pyannote-v3-pro/W8A16/README.txt +6 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedder.mlmodelc/analytics/coremldata.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedder.mlmodelc/coremldata.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedder.mlmodelc/metadata.json +87 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedder.mlmodelc/model.mil +0 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedder.mlmodelc/weights/weight.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedderPreprocessor.mlmodelc/analytics/coremldata.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedderPreprocessor.mlmodelc/coremldata.bin +3 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedderPreprocessor.mlmodelc/metadata.json +77 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedderPreprocessor.mlmodelc/model.mil +90 -0
- speaker_embedder/pyannote-v3-pro/W8A16/SpeakerEmbedderPreprocessor.mlmodelc/weights/weight.bin +3 -0
- speaker_segmenter/pyannote-v3-pro/LICENSE_NOTICE.txt +7 -0
- speaker_segmenter/pyannote-v3-pro/README.txt +6 -0
- speaker_segmenter/pyannote-v3-pro/W32A32/LICENSE_NOTICE.txt +7 -0
- speaker_segmenter/pyannote-v3-pro/W32A32/README.txt +6 -0
- speaker_segmenter/pyannote-v3-pro/W32A32/SpeakerSegmenter.mlmodelc/analytics/coremldata.bin +3 -0
- speaker_segmenter/pyannote-v3-pro/W32A32/SpeakerSegmenter.mlmodelc/coremldata.bin +3 -0
- speaker_segmenter/pyannote-v3-pro/W32A32/SpeakerSegmenter.mlmodelc/metadata.json +144 -0
- speaker_segmenter/pyannote-v3-pro/W32A32/SpeakerSegmenter.mlmodelc/model.mil +0 -0
- speaker_segmenter/pyannote-v3-pro/W32A32/SpeakerSegmenter.mlmodelc/weights/weight.bin +3 -0
- speaker_segmenter/pyannote-v3-pro/W8A16/LICENSE_NOTICE.txt +7 -0
- speaker_segmenter/pyannote-v3-pro/W8A16/README.txt +6 -0
- speaker_segmenter/pyannote-v3-pro/W8A16/SpeakerSegmenter.mlmodelc/analytics/coremldata.bin +3 -0
- speaker_segmenter/pyannote-v3-pro/W8A16/SpeakerSegmenter.mlmodelc/coremldata.bin +3 -0
- speaker_segmenter/pyannote-v3-pro/W8A16/SpeakerSegmenter.mlmodelc/metadata.json +145 -0
- speaker_segmenter/pyannote-v3-pro/W8A16/SpeakerSegmenter.mlmodelc/model.mil +0 -0
- speaker_segmenter/pyannote-v3-pro/W8A16/SpeakerSegmenter.mlmodelc/weights/weight.bin +3 -0
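
The W16A16, W8A16, and W32A32 folders hold the same models at different storage precisions (per the metadata below: float16, 8-bit palettized weights, and float32, respectively). As a minimal sketch of fetching one variant and loading it — assuming access to the gated argmaxinc/speakerkit-pro repo, macOS, coremltools ≥ 6, and huggingface_hub; none of this is SpeakerKit's official API:

```python
# Minimal sketch: fetch one precision variant of the embedder and load the
# compiled Core ML model. Assumes access to the gated repo, macOS, and
# coremltools >= 6 (which provides CompiledMLModel for .mlmodelc bundles).
from huggingface_hub import snapshot_download
import coremltools as ct

local_dir = snapshot_download(
    repo_id="argmaxinc/speakerkit-pro",
    allow_patterns=["speaker_embedder/pyannote-v3-pro/W16A16/*"],
)
embedder = ct.models.CompiledMLModel(
    f"{local_dir}/speaker_embedder/pyannote-v3-pro/W16A16/SpeakerEmbedder.mlmodelc"
)
```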
@@ -0,0 +1,7 @@
+Argmax proprietary and confidential. Under NDA.
+
+Copyright 2025 Argmax, Inc. All rights reserved.
+
+Unauthorized access, copying, use, distribution, and/or commercialization of this file, via any medium or means, is strictly prohibited.
+
+Please contact Argmax for licensing information at [email protected].
@@ -0,0 +1,6 @@
+# License
+
+Original model weights: https://github.com/wenet-e2e/wespeaker/blob/master/docs/pretrained.md#model-license
+Argmax-optimized model assets (assets with the `.mlmodelc` extension): https://huggingface.co/argmaxinc/speakerkit-pro/blob/main/LICENSE_NOTICE.txt
+
+Please contact [email protected] for licensing SpeakerKit Pro assets.
@@ -0,0 +1,7 @@
+Argmax proprietary and confidential. Under NDA.
+
+Copyright 2025 Argmax, Inc. All rights reserved.
+
+Unauthorized access, copying, use, distribution, and/or commercialization of this file, via any medium or means, is strictly prohibited.
+
+Please contact Argmax for licensing information at [email protected].
@@ -0,0 +1,6 @@
+# License
+
+Original model weights: https://github.com/wenet-e2e/wespeaker/blob/master/docs/pretrained.md#model-license
+Argmax-optimized model assets (assets with the `.mlmodelc` extension): https://huggingface.co/argmaxinc/speakerkit-pro/blob/main/LICENSE_NOTICE.txt
+
+Please contact [email protected] for licensing SpeakerKit Pro assets.
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:31ebd86f9f3a87ee2bb1aa32722968e3f6821d6b393171bb6b92683213f173e1
+size 243
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1bbb69d66cdb7f69a6c9d4dc1ff9b114d6097bb69581e12a706cf16e27ce10be
+size 370
@@ -0,0 +1,86 @@
+[
+  {
+    "metadataOutputVersion" : "3.0",
+    "storagePrecision" : "Float16",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 64 × 256)",
+        "shortDescription" : "",
+        "shape" : "[1, 64, 256]",
+        "name" : "speaker_embeddings",
+        "type" : "MultiArray"
+      }
+    ],
+    "modelParameters" : [
+
+    ],
+    "specificationVersion" : 7,
+    "mlProgramOperationTypeHistogram" : {
+      "Concat" : 64,
+      "Ios16.mul" : 256,
+      "SliceByIndex" : 64,
+      "Transpose" : 1,
+      "Ios16.sub" : 128,
+      "Ios16.sqrt" : 64,
+      "Stack" : 1,
+      "UpsampleNearestNeighbor" : 1,
+      "Ios16.conv" : 36,
+      "Ios16.add" : 144,
+      "Squeeze" : 1,
+      "Ios16.relu" : 33,
+      "Ios16.realDiv" : 192,
+      "Ios16.reduceSum" : 256,
+      "ExpandDims" : 130,
+      "Ios16.linear" : 1,
+      "Ios16.reshape" : 1
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "stateSchema" : [
+
+    ],
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.version" : "8.2",
+      "com.github.apple.coremltools.source" : "torch==2.6.0"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 998 × 80)",
+        "shortDescription" : "",
+        "shape" : "[1, 998, 80]",
+        "name" : "preprocessor_output_1",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 64 × 589)",
+        "shortDescription" : "",
+        "shape" : "[1, 64, 589]",
+        "name" : "speaker_masks",
+        "type" : "MultiArray"
+      }
+    ],
+    "generatedClassName" : "SpeakerEmbedding",
+    "method" : "predict"
+  }
+]
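
This schema pins down how the embedder is driven: 80-dim log-mel features for a 10 s window (998 frames) plus up to 64 per-speaker masks at a 589-frame resolution, yielding one 256-dim embedding per mask slot. A sketch of chaining the preprocessor into the embedder under those shapes — how the preprocessor's 2998-frame (30 s) output gets windowed down to the 998 frames the embedder expects is an assumption here (a single 10 s slice), not something this diff documents:

```python
# Sketch: preprocessor -> embedder, with input/output names and shapes taken
# from the two metadata.json schemas in this commit; `local_dir` comes from
# the earlier download snippet. The 998-frame slice and the all-ones masks
# are placeholders, not the SpeakerKit pipeline's real windowing/masking.
import numpy as np
import coremltools as ct

base = f"{local_dir}/speaker_embedder/pyannote-v3-pro/W16A16"
pre = ct.models.CompiledMLModel(f"{base}/SpeakerEmbedderPreprocessor.mlmodelc")
emb = ct.models.CompiledMLModel(f"{base}/SpeakerEmbedder.mlmodelc")

audio = np.zeros((1, 480000), dtype=np.float16)   # 30 s of 16 kHz audio
feats = pre.predict({"waveforms": audio})["preprocessor_output_1"]  # (1, 2998, 80)
window = feats[:, :998, :]                         # assumed single 10 s slice
masks = np.ones((1, 64, 589), dtype=np.float16)    # placeholder speaker masks
out = emb.predict({"preprocessor_output_1": window, "speaker_masks": masks})
embeddings = out["speaker_embeddings"]             # (1, 64, 256)
```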
The diff for this file is too large to render; see the raw diff.
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6dba18a57a81b1e872802ca4def29541bb7900ccff430d9b2040092cadd7d688
+size 13264960
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1383750df1af99af002f0c3403bcf19a18c3d749706eb3498d34b0fe01abf2fc
+size 243
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dc230803421bf4fe14f843ea5b5fa0035487fd19cdd69ed670d72560b6a44586
+size 330
@@ -0,0 +1,77 @@
+[
+  {
+    "metadataOutputVersion" : "3.0",
+    "storagePrecision" : "Float32",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 2998 × 80)",
+        "shortDescription" : "",
+        "shape" : "[1, 2998, 80]",
+        "name" : "preprocessor_output_1",
+        "type" : "MultiArray"
+      }
+    ],
+    "modelParameters" : [
+
+    ],
+    "specificationVersion" : 7,
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 2,
+      "Ios16.mul" : 4,
+      "SliceByIndex" : 2,
+      "Transpose" : 2,
+      "SlidingWindows" : 1,
+      "Ios16.sub" : 3,
+      "Ios16.log" : 1,
+      "Ios16.reduceMean" : 2,
+      "Ios16.square" : 2,
+      "Squeeze" : 2,
+      "Ios16.matmul" : 2,
+      "Ios16.add" : 1,
+      "Ios16.linear" : 1,
+      "ExpandDims" : 4,
+      "Ios16.gather" : 2,
+      "Ios16.maximum" : 1,
+      "Identity" : 1,
+      "Pad" : 2
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "stateSchema" : [
+
+    ],
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.source" : "torch==2.6.0",
+      "com.github.apple.coremltools.version" : "8.2"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 480000)",
+        "shortDescription" : "",
+        "shape" : "[1, 480000]",
+        "name" : "waveforms",
+        "type" : "MultiArray"
+      }
+    ],
+    "generatedClassName" : "SpeakerEmbeddingPreprocessor",
+    "method" : "predict"
+  }
+]
@@ -0,0 +1,90 @@
+program(1.0)
+[buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "3402.3.2"}, {"coremlc-version", "3402.4.1"}, {"coremltools-component-torch", "2.6.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "8.2"}})]
+{
+  func main<ios16>(tensor<fp16, [1, 480000]> waveforms) {
+    tensor<string, []> cast_0_dtype_0 = const()[name = tensor<string, []>("cast_0_dtype_0"), val = tensor<string, []>("fp32")];
+    tensor<fp32, []> var_2_promoted = const()[name = tensor<string, []>("op_2_promoted"), val = tensor<fp32, []>(0x1p+15)];
+    tensor<fp32, [1, 480000]> cast_0 = cast(dtype = cast_0_dtype_0, x = waveforms)[name = tensor<string, []>("cast_11")];
+    tensor<fp32, [1, 480000]> waveform_1 = mul(x = cast_0, y = var_2_promoted)[name = tensor<string, []>("waveform_1")];
+    tensor<int32, [2]> var_6_begin_0 = const()[name = tensor<string, []>("op_6_begin_0"), val = tensor<int32, [2]>([0, 0])];
+    tensor<int32, [2]> var_6_end_0 = const()[name = tensor<string, []>("op_6_end_0"), val = tensor<int32, [2]>([1, 480000])];
+    tensor<bool, [2]> var_6_end_mask_0 = const()[name = tensor<string, []>("op_6_end_mask_0"), val = tensor<bool, [2]>([false, true])];
+    tensor<bool, [2]> var_6_squeeze_mask_0 = const()[name = tensor<string, []>("op_6_squeeze_mask_0"), val = tensor<bool, [2]>([true, false])];
+    tensor<fp32, [480000]> var_6 = slice_by_index(begin = var_6_begin_0, end = var_6_end_0, end_mask = var_6_end_mask_0, squeeze_mask = var_6_squeeze_mask_0, x = waveform_1)[name = tensor<string, []>("op_6")];
+    tensor<int32, []> sliding_windows_0_axis_0 = const()[name = tensor<string, []>("sliding_windows_0_axis_0"), val = tensor<int32, []>(0)];
+    tensor<int32, []> sliding_windows_0_size_0 = const()[name = tensor<string, []>("sliding_windows_0_size_0"), val = tensor<int32, []>(400)];
+    tensor<int32, []> sliding_windows_0_stride_0 = const()[name = tensor<string, []>("sliding_windows_0_stride_0"), val = tensor<int32, []>(160)];
+    tensor<fp32, [2998, 400]> sliding_windows_0 = sliding_windows(axis = sliding_windows_0_axis_0, size = sliding_windows_0_size_0, stride = sliding_windows_0_stride_0, x = var_6)[name = tensor<string, []>("sliding_windows_0")];
+    tensor<int32, [1]> var_42_axes_0 = const()[name = tensor<string, []>("op_42_axes_0"), val = tensor<int32, [1]>([1])];
+    tensor<bool, []> var_42_keep_dims_0 = const()[name = tensor<string, []>("op_42_keep_dims_0"), val = tensor<bool, []>(false)];
+    tensor<fp32, [2998]> var_42 = reduce_mean(axes = var_42_axes_0, keep_dims = var_42_keep_dims_0, x = sliding_windows_0)[name = tensor<string, []>("op_42")];
+    tensor<int32, [1]> row_means_axes_0 = const()[name = tensor<string, []>("row_means_axes_0"), val = tensor<int32, [1]>([1])];
+    tensor<fp32, [2998, 1]> row_means = expand_dims(axes = row_means_axes_0, x = var_42)[name = tensor<string, []>("row_means")];
+    tensor<fp32, [2998, 400]> strided_input_3 = sub(x = sliding_windows_0, y = row_means)[name = tensor<string, []>("strided_input_3")];
+    tensor<int32, [1]> input_1_axes_0 = const()[name = tensor<string, []>("input_1_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [1, 2998, 400]> input_1 = expand_dims(axes = input_1_axes_0, x = strided_input_3)[name = tensor<string, []>("input_1")];
+    tensor<fp32, []> const_2 = const()[name = tensor<string, []>("const_2"), val = tensor<fp32, []>(0x0p+0)];
+    tensor<int32, [6]> var_54_pad_0 = const()[name = tensor<string, []>("op_54_pad_0"), val = tensor<int32, [6]>([0, 0, 0, 0, 1, 0])];
+    tensor<string, []> var_54_mode_0 = const()[name = tensor<string, []>("op_54_mode_0"), val = tensor<string, []>("replicate")];
+    tensor<fp32, [1, 2998, 401]> var_54 = pad(constant_val = const_2, mode = var_54_mode_0, pad = var_54_pad_0, x = input_1)[name = tensor<string, []>("op_54")];
+    tensor<int32, [1]> offset_strided_input_axes_0 = const()[name = tensor<string, []>("offset_strided_input_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [2998, 401]> offset_strided_input = squeeze(axes = offset_strided_input_axes_0, x = var_54)[name = tensor<string, []>("offset_strided_input")];
+    tensor<int32, [2]> var_66_begin_0 = const()[name = tensor<string, []>("op_66_begin_0"), val = tensor<int32, [2]>([0, 0])];
+    tensor<int32, [2]> var_66_end_0 = const()[name = tensor<string, []>("op_66_end_0"), val = tensor<int32, [2]>([2998, 400])];
+    tensor<bool, [2]> var_66_end_mask_0 = const()[name = tensor<string, []>("op_66_end_mask_0"), val = tensor<bool, [2]>([true, false])];
+    tensor<fp32, [2998, 400]> var_66 = slice_by_index(begin = var_66_begin_0, end = var_66_end_0, end_mask = var_66_end_mask_0, x = offset_strided_input)[name = tensor<string, []>("op_66")];
+    tensor<fp32, []> var_67 = const()[name = tensor<string, []>("op_67"), val = tensor<fp32, []>(0x1.f0a3d8p-1)];
+    tensor<fp32, [2998, 400]> var_68 = mul(x = var_66, y = var_67)[name = tensor<string, []>("op_68")];
+    tensor<fp32, [2998, 400]> strided_input_5 = sub(x = strided_input_3, y = var_68)[name = tensor<string, []>("strided_input_5")];
+    tensor<fp32, [1, 400]> window_function = const()[name = tensor<string, []>("window_function"), val = tensor<fp32, [1, 400]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))];
+    tensor<fp32, [2998, 400]> strided_input_7 = mul(x = strided_input_5, y = window_function)[name = tensor<string, []>("strided_input_7")];
+    tensor<int32, [1]> input_3_axes_0 = const()[name = tensor<string, []>("input_3_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [1, 2998, 400]> input_3 = expand_dims(axes = input_3_axes_0, x = strided_input_7)[name = tensor<string, []>("input_3")];
+    tensor<fp32, []> const_3 = const()[name = tensor<string, []>("const_3"), val = tensor<fp32, []>(0x0p+0)];
+    tensor<int32, [6]> var_90_pad_0 = const()[name = tensor<string, []>("op_90_pad_0"), val = tensor<int32, [6]>([0, 0, 0, 0, 0, 112])];
+    tensor<string, []> var_90_mode_0 = const()[name = tensor<string, []>("op_90_mode_0"), val = tensor<string, []>("constant")];
+    tensor<fp32, [1, 2998, 512]> var_90 = pad(constant_val = const_3, mode = var_90_mode_0, pad = var_90_pad_0, x = input_3)[name = tensor<string, []>("op_90")];
+    tensor<int32, [1]> strided_input_axes_0 = const()[name = tensor<string, []>("strided_input_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [2998, 512]> strided_input = squeeze(axes = strided_input_axes_0, x = var_90)[name = tensor<string, []>("strided_input")];
+    tensor<fp32, [512, 512]> cos_0 = const()[name = tensor<string, []>("cos_0"), val = tensor<fp32, [512, 512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1728)))];
+    tensor<fp32, [512, 512]> sin_0 = const()[name = tensor<string, []>("sin_0"), val = tensor<fp32, [512, 512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1050368)))];
+    tensor<bool, []> matmul_1_transpose_x_1 = const()[name = tensor<string, []>("matmul_1_transpose_x_1"), val = tensor<bool, []>(false)];
+    tensor<bool, []> matmul_1_transpose_y_1 = const()[name = tensor<string, []>("matmul_1_transpose_y_1"), val = tensor<bool, []>(true)];
+    tensor<fp32, [512, 2998]> matmul_1 = matmul(transpose_x = matmul_1_transpose_x_1, transpose_y = matmul_1_transpose_y_1, x = cos_0, y = strided_input)[name = tensor<string, []>("matmul_1")];
+    tensor<bool, []> matmul_3_transpose_x_1 = const()[name = tensor<string, []>("matmul_3_transpose_x_1"), val = tensor<bool, []>(false)];
+    tensor<bool, []> matmul_3_transpose_y_1 = const()[name = tensor<string, []>("matmul_3_transpose_y_1"), val = tensor<bool, []>(true)];
+    tensor<fp32, [512, 2998]> matmul_3 = matmul(transpose_x = matmul_3_transpose_x_1, transpose_y = matmul_3_transpose_y_1, x = sin_0, y = strided_input)[name = tensor<string, []>("matmul_3")];
+    tensor<fp32, []> mul_1_y_0 = const()[name = tensor<string, []>("mul_1_y_0"), val = tensor<fp32, []>(-0x1p+0)];
+    tensor<fp32, [512, 2998]> mul_1 = mul(x = matmul_3, y = mul_1_y_0)[name = tensor<string, []>("mul_1")];
+    tensor<int32, [2]> transpose_3_perm_0 = const()[name = tensor<string, []>("transpose_3_perm_0"), val = tensor<int32, [2]>([-1, 0])];
+    tensor<int32, [2]> transpose_4_perm_0 = const()[name = tensor<string, []>("transpose_4_perm_0"), val = tensor<int32, [2]>([-1, 0])];
+    tensor<int32, [257]> range_1d_2 = const()[name = tensor<string, []>("range_1d_2"), val = tensor<int32, [257]>([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256])];
+    tensor<int32, []> gather_0_axis_0 = const()[name = tensor<string, []>("gather_0_axis_0"), val = tensor<int32, []>(-1)];
+    tensor<int32, []> gather_0_batch_dims_0 = const()[name = tensor<string, []>("gather_0_batch_dims_0"), val = tensor<int32, []>(0)];
+    tensor<fp32, [2998, 512]> transpose_3 = transpose(perm = transpose_3_perm_0, x = matmul_1)[name = tensor<string, []>("transpose_6")];
+    tensor<fp32, [2998, 257]> gather_0 = gather(axis = gather_0_axis_0, batch_dims = gather_0_batch_dims_0, indices = range_1d_2, x = transpose_3)[name = tensor<string, []>("gather_0")];
+    tensor<int32, []> gather_1_axis_0 = const()[name = tensor<string, []>("gather_1_axis_0"), val = tensor<int32, []>(-1)];
+    tensor<int32, []> gather_1_batch_dims_0 = const()[name = tensor<string, []>("gather_1_batch_dims_0"), val = tensor<int32, []>(0)];
+    tensor<fp32, [2998, 512]> transpose_4 = transpose(perm = transpose_4_perm_0, x = mul_1)[name = tensor<string, []>("transpose_5")];
+    tensor<fp32, [2998, 257]> gather_1 = gather(axis = gather_1_axis_0, batch_dims = gather_1_batch_dims_0, indices = range_1d_2, x = transpose_4)[name = tensor<string, []>("gather_1")];
+    tensor<fp32, [2998, 257]> square_0 = square(x = gather_0)[name = tensor<string, []>("square_0")];
+    tensor<fp32, [2998, 257]> square_1 = square(x = gather_1)[name = tensor<string, []>("square_1")];
+    tensor<fp32, [2998, 257]> add_1 = add(x = square_0, y = square_1)[name = tensor<string, []>("add_1")];
+    tensor<fp32, [2998, 257]> spectrum = identity(x = add_1)[name = tensor<string, []>("spectrum")];
+    tensor<fp32, [80, 257]> mel_energies_3 = const()[name = tensor<string, []>("mel_energies_3"), val = tensor<fp32, [80, 257]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2099008)))];
+    tensor<fp32, [80]> mel_energies_bias_0 = const()[name = tensor<string, []>("mel_energies_bias_0"), val = tensor<fp32, [80]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2181312)))];
+    tensor<fp32, [2998, 80]> mel_energies = linear(bias = mel_energies_bias_0, weight = mel_energies_3, x = spectrum)[name = tensor<string, []>("mel_energies")];
+    tensor<fp32, []> const_10 = const()[name = tensor<string, []>("const_10"), val = tensor<fp32, []>(0x1p-23)];
+    tensor<fp32, [2998, 80]> var_186 = maximum(x = mel_energies, y = const_10)[name = tensor<string, []>("op_186")];
+    tensor<fp32, []> filter_banks_epsilon_0 = const()[name = tensor<string, []>("filter_banks_epsilon_0"), val = tensor<fp32, []>(0x1p-149)];
+    tensor<fp32, [2998, 80]> filter_banks = log(epsilon = filter_banks_epsilon_0, x = var_186)[name = tensor<string, []>("filter_banks")];
+    tensor<int32, [1]> var_192_axes_0 = const()[name = tensor<string, []>("op_192_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<bool, []> var_192_keep_dims_0 = const()[name = tensor<string, []>("op_192_keep_dims_0"), val = tensor<bool, []>(true)];
+    tensor<fp32, [1, 80]> var_192 = reduce_mean(axes = var_192_axes_0, keep_dims = var_192_keep_dims_0, x = filter_banks)[name = tensor<string, []>("op_192")];
+    tensor<fp32, [2998, 80]> var_194 = sub(x = filter_banks, y = var_192)[name = tensor<string, []>("op_194")];
+    tensor<int32, [1]> obj_axes_0 = const()[name = tensor<string, []>("obj_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [1, 2998, 80]> preprocessor_output_1_type_fp32 = expand_dims(axes = obj_axes_0, x = var_194)[name = tensor<string, []>("obj")];
+    tensor<string, []> cast_9_dtype_0 = const()[name = tensor<string, []>("cast_9_dtype_0"), val = tensor<string, []>("fp16")];
+    tensor<fp16, [1, 2998, 80]> preprocessor_output_1 = cast(dtype = cast_9_dtype_0, x = preprocessor_output_1_type_fp32)[name = tensor<string, []>("cast_10")];
+  } -> (preprocessor_output_1);
+}
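
Read end to end, this MIL program is a fixed Kaldi-style log-mel (fbank) front end: scale the fp16 waveform to int16 range (0x1p+15 = 32768), frame with a 400-sample window and 160-sample hop (2998 frames from 480000 samples), remove each frame's DC offset, apply pre-emphasis with coefficient 0x1.f0a3d8p-1 ≈ 0.97, multiply by a stored window, zero-pad to 512, take the power spectrum via cos/sin matmuls (257 bins), project through an 80-band mel filterbank, floor at 0x1p-23, take the log, and subtract the per-utterance mean. A rough NumPy equivalent of that dataflow — the real window and mel weights live in weights/weight.bin, so the Hann window and the `mel_weights`/`mel_bias` arguments below are stand-in assumptions:

```python
# Sketch of the DSP pipeline encoded in the MIL program above. Constants
# (frame 400 / hop 160 / FFT 512 / 80 mel bins / pre-emphasis 0.97 / 2**15
# scaling / per-utterance mean subtraction) are read off the program; the
# Hann window and mel_weights/mel_bias are placeholders for the blobs in
# weights/weight.bin.
import numpy as np

def log_mel(waveform, mel_weights, mel_bias):
    x = waveform.astype(np.float32) * 2.0**15              # int16 scaling
    n = 1 + (len(x) - 400) // 160                          # 2998 for 480000
    frames = np.stack([x[i*160 : i*160 + 400] for i in range(n)])
    frames -= frames.mean(axis=1, keepdims=True)           # remove DC offset
    prev = np.pad(frames, ((0, 0), (1, 0)), mode="edge")[:, :400]
    frames = frames - 0.97 * prev                          # pre-emphasis
    frames *= np.hanning(400)                              # stand-in window
    spec = np.abs(np.fft.rfft(frames, n=512)) ** 2         # 257-bin power
    mel = np.maximum(spec @ mel_weights.T + mel_bias, 2.0**-23)
    feats = np.log(mel)
    return feats - feats.mean(axis=0, keepdims=True)       # (n, 80), mean-normed
```

Expressing the 512-point DFT as two dense matmuls against precomputed cos/sin tables keeps the whole front end inside the mlprogram op set rather than relying on an FFT primitive.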
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f2c284bd22f1f7ab76901c1c6e57f82d4ebbf057fa0b924aad057f124f77a89
+size 2181696
@@ -0,0 +1,7 @@
+Argmax proprietary and confidential. Under NDA.
+
+Copyright 2025 Argmax, Inc. All rights reserved.
+
+Unauthorized access, copying, use, distribution, and/or commercialization of this file, via any medium or means, is strictly prohibited.
+
+Please contact Argmax for licensing information at [email protected].
@@ -0,0 +1,6 @@
+# License
+
+Original model weights: https://github.com/wenet-e2e/wespeaker/blob/master/docs/pretrained.md#model-license
+Argmax-optimized model assets (assets with the `.mlmodelc` extension): https://huggingface.co/argmaxinc/speakerkit-pro/blob/main/LICENSE_NOTICE.txt
+
+Please contact [email protected] for licensing SpeakerKit Pro assets.
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:642e75621f11e461372ebf68c2861b4d56b48b89027295cfac05b518f88fc8f7
+size 243
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1bbb69d66cdb7f69a6c9d4dc1ff9b114d6097bb69581e12a706cf16e27ce10be
+size 370
@@ -0,0 +1,87 @@
+[
+  {
+    "metadataOutputVersion" : "3.0",
+    "storagePrecision" : "Mixed (Float16, Palettized (8 bits))",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 64 × 256)",
+        "shortDescription" : "",
+        "shape" : "[1, 64, 256]",
+        "name" : "speaker_embeddings",
+        "type" : "MultiArray"
+      }
+    ],
+    "modelParameters" : [
+
+    ],
+    "specificationVersion" : 7,
+    "mlProgramOperationTypeHistogram" : {
+      "Concat" : 64,
+      "Ios16.mul" : 256,
+      "SliceByIndex" : 64,
+      "Ios16.constexprLutToDense" : 35,
+      "Transpose" : 1,
+      "Ios16.sub" : 128,
+      "Ios16.sqrt" : 64,
+      "Stack" : 1,
+      "UpsampleNearestNeighbor" : 1,
+      "Ios16.conv" : 36,
+      "Ios16.add" : 144,
+      "Squeeze" : 1,
+      "Ios16.relu" : 33,
+      "Ios16.realDiv" : 192,
+      "Ios16.reduceSum" : 256,
+      "ExpandDims" : 130,
+      "Ios16.linear" : 1,
+      "Ios16.reshape" : 1
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "stateSchema" : [
+
+    ],
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.source" : "torch==2.6.0",
+      "com.github.apple.coremltools.version" : "8.2"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 998 × 80)",
+        "shortDescription" : "",
+        "shape" : "[1, 998, 80]",
+        "name" : "preprocessor_output_1",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 64 × 589)",
+        "shortDescription" : "",
+        "shape" : "[1, 64, 589]",
+        "name" : "speaker_masks",
+        "type" : "MultiArray"
+      }
+    ],
+    "generatedClassName" : "SpeakerEmbedding_8_bit",
+    "method" : "predict"
+  }
+]
The diff for this file is too large to render; see the raw diff.
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:14c666c28766dd780a3afc3dbb4b44078e418e16f44d97780b9f8555407213a1
+size 6661888
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1383750df1af99af002f0c3403bcf19a18c3d749706eb3498d34b0fe01abf2fc
+size 243
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dc230803421bf4fe14f843ea5b5fa0035487fd19cdd69ed670d72560b6a44586
+size 330
@@ -0,0 +1,77 @@
+[
+  {
+    "metadataOutputVersion" : "3.0",
+    "storagePrecision" : "Float32",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 2998 × 80)",
+        "shortDescription" : "",
+        "shape" : "[1, 2998, 80]",
+        "name" : "preprocessor_output_1",
+        "type" : "MultiArray"
+      }
+    ],
+    "modelParameters" : [
+
+    ],
+    "specificationVersion" : 7,
+    "mlProgramOperationTypeHistogram" : {
+      "Ios16.cast" : 2,
+      "Ios16.mul" : 4,
+      "SliceByIndex" : 2,
+      "Transpose" : 2,
+      "SlidingWindows" : 1,
+      "Ios16.sub" : 3,
+      "Ios16.log" : 1,
+      "Ios16.reduceMean" : 2,
+      "Ios16.square" : 2,
+      "Squeeze" : 2,
+      "Ios16.matmul" : 2,
+      "Ios16.add" : 1,
+      "Ios16.linear" : 1,
+      "ExpandDims" : 4,
+      "Ios16.gather" : 2,
+      "Ios16.maximum" : 1,
+      "Identity" : 1,
+      "Pad" : 2
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "stateSchema" : [
+
+    ],
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.source" : "torch==2.6.0",
+      "com.github.apple.coremltools.version" : "8.2"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1 × 480000)",
+        "shortDescription" : "",
+        "shape" : "[1, 480000]",
+        "name" : "waveforms",
+        "type" : "MultiArray"
+      }
+    ],
+    "generatedClassName" : "SpeakerEmbeddingPreprocessor",
+    "method" : "predict"
+  }
+]
@@ -0,0 +1,90 @@
+program(1.0)
+[buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "3402.3.2"}, {"coremlc-version", "3402.4.1"}, {"coremltools-component-torch", "2.6.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "8.2"}})]
+{
+  func main<ios16>(tensor<fp16, [1, 480000]> waveforms) {
+    tensor<string, []> cast_0_dtype_0 = const()[name = tensor<string, []>("cast_0_dtype_0"), val = tensor<string, []>("fp32")];
+    tensor<fp32, []> var_2_promoted = const()[name = tensor<string, []>("op_2_promoted"), val = tensor<fp32, []>(0x1p+15)];
+    tensor<fp32, [1, 480000]> cast_0 = cast(dtype = cast_0_dtype_0, x = waveforms)[name = tensor<string, []>("cast_11")];
+    tensor<fp32, [1, 480000]> waveform_1 = mul(x = cast_0, y = var_2_promoted)[name = tensor<string, []>("waveform_1")];
+    tensor<int32, [2]> var_6_begin_0 = const()[name = tensor<string, []>("op_6_begin_0"), val = tensor<int32, [2]>([0, 0])];
+    tensor<int32, [2]> var_6_end_0 = const()[name = tensor<string, []>("op_6_end_0"), val = tensor<int32, [2]>([1, 480000])];
+    tensor<bool, [2]> var_6_end_mask_0 = const()[name = tensor<string, []>("op_6_end_mask_0"), val = tensor<bool, [2]>([false, true])];
+    tensor<bool, [2]> var_6_squeeze_mask_0 = const()[name = tensor<string, []>("op_6_squeeze_mask_0"), val = tensor<bool, [2]>([true, false])];
+    tensor<fp32, [480000]> var_6 = slice_by_index(begin = var_6_begin_0, end = var_6_end_0, end_mask = var_6_end_mask_0, squeeze_mask = var_6_squeeze_mask_0, x = waveform_1)[name = tensor<string, []>("op_6")];
+    tensor<int32, []> sliding_windows_0_axis_0 = const()[name = tensor<string, []>("sliding_windows_0_axis_0"), val = tensor<int32, []>(0)];
+    tensor<int32, []> sliding_windows_0_size_0 = const()[name = tensor<string, []>("sliding_windows_0_size_0"), val = tensor<int32, []>(400)];
+    tensor<int32, []> sliding_windows_0_stride_0 = const()[name = tensor<string, []>("sliding_windows_0_stride_0"), val = tensor<int32, []>(160)];
+    tensor<fp32, [2998, 400]> sliding_windows_0 = sliding_windows(axis = sliding_windows_0_axis_0, size = sliding_windows_0_size_0, stride = sliding_windows_0_stride_0, x = var_6)[name = tensor<string, []>("sliding_windows_0")];
+    tensor<int32, [1]> var_42_axes_0 = const()[name = tensor<string, []>("op_42_axes_0"), val = tensor<int32, [1]>([1])];
+    tensor<bool, []> var_42_keep_dims_0 = const()[name = tensor<string, []>("op_42_keep_dims_0"), val = tensor<bool, []>(false)];
+    tensor<fp32, [2998]> var_42 = reduce_mean(axes = var_42_axes_0, keep_dims = var_42_keep_dims_0, x = sliding_windows_0)[name = tensor<string, []>("op_42")];
+    tensor<int32, [1]> row_means_axes_0 = const()[name = tensor<string, []>("row_means_axes_0"), val = tensor<int32, [1]>([1])];
+    tensor<fp32, [2998, 1]> row_means = expand_dims(axes = row_means_axes_0, x = var_42)[name = tensor<string, []>("row_means")];
+    tensor<fp32, [2998, 400]> strided_input_3 = sub(x = sliding_windows_0, y = row_means)[name = tensor<string, []>("strided_input_3")];
+    tensor<int32, [1]> input_1_axes_0 = const()[name = tensor<string, []>("input_1_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [1, 2998, 400]> input_1 = expand_dims(axes = input_1_axes_0, x = strided_input_3)[name = tensor<string, []>("input_1")];
+    tensor<fp32, []> const_2 = const()[name = tensor<string, []>("const_2"), val = tensor<fp32, []>(0x0p+0)];
+    tensor<int32, [6]> var_54_pad_0 = const()[name = tensor<string, []>("op_54_pad_0"), val = tensor<int32, [6]>([0, 0, 0, 0, 1, 0])];
+    tensor<string, []> var_54_mode_0 = const()[name = tensor<string, []>("op_54_mode_0"), val = tensor<string, []>("replicate")];
+    tensor<fp32, [1, 2998, 401]> var_54 = pad(constant_val = const_2, mode = var_54_mode_0, pad = var_54_pad_0, x = input_1)[name = tensor<string, []>("op_54")];
+    tensor<int32, [1]> offset_strided_input_axes_0 = const()[name = tensor<string, []>("offset_strided_input_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [2998, 401]> offset_strided_input = squeeze(axes = offset_strided_input_axes_0, x = var_54)[name = tensor<string, []>("offset_strided_input")];
+    tensor<int32, [2]> var_66_begin_0 = const()[name = tensor<string, []>("op_66_begin_0"), val = tensor<int32, [2]>([0, 0])];
+    tensor<int32, [2]> var_66_end_0 = const()[name = tensor<string, []>("op_66_end_0"), val = tensor<int32, [2]>([2998, 400])];
+    tensor<bool, [2]> var_66_end_mask_0 = const()[name = tensor<string, []>("op_66_end_mask_0"), val = tensor<bool, [2]>([true, false])];
+    tensor<fp32, [2998, 400]> var_66 = slice_by_index(begin = var_66_begin_0, end = var_66_end_0, end_mask = var_66_end_mask_0, x = offset_strided_input)[name = tensor<string, []>("op_66")];
+    tensor<fp32, []> var_67 = const()[name = tensor<string, []>("op_67"), val = tensor<fp32, []>(0x1.f0a3d8p-1)];
+    tensor<fp32, [2998, 400]> var_68 = mul(x = var_66, y = var_67)[name = tensor<string, []>("op_68")];
+    tensor<fp32, [2998, 400]> strided_input_5 = sub(x = strided_input_3, y = var_68)[name = tensor<string, []>("strided_input_5")];
+    tensor<fp32, [1, 400]> window_function = const()[name = tensor<string, []>("window_function"), val = tensor<fp32, [1, 400]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))];
+    tensor<fp32, [2998, 400]> strided_input_7 = mul(x = strided_input_5, y = window_function)[name = tensor<string, []>("strided_input_7")];
+    tensor<int32, [1]> input_3_axes_0 = const()[name = tensor<string, []>("input_3_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [1, 2998, 400]> input_3 = expand_dims(axes = input_3_axes_0, x = strided_input_7)[name = tensor<string, []>("input_3")];
+    tensor<fp32, []> const_3 = const()[name = tensor<string, []>("const_3"), val = tensor<fp32, []>(0x0p+0)];
+    tensor<int32, [6]> var_90_pad_0 = const()[name = tensor<string, []>("op_90_pad_0"), val = tensor<int32, [6]>([0, 0, 0, 0, 0, 112])];
+    tensor<string, []> var_90_mode_0 = const()[name = tensor<string, []>("op_90_mode_0"), val = tensor<string, []>("constant")];
+    tensor<fp32, [1, 2998, 512]> var_90 = pad(constant_val = const_3, mode = var_90_mode_0, pad = var_90_pad_0, x = input_3)[name = tensor<string, []>("op_90")];
+    tensor<int32, [1]> strided_input_axes_0 = const()[name = tensor<string, []>("strided_input_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [2998, 512]> strided_input = squeeze(axes = strided_input_axes_0, x = var_90)[name = tensor<string, []>("strided_input")];
+    tensor<fp32, [512, 512]> cos_0 = const()[name = tensor<string, []>("cos_0"), val = tensor<fp32, [512, 512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1728)))];
+    tensor<fp32, [512, 512]> sin_0 = const()[name = tensor<string, []>("sin_0"), val = tensor<fp32, [512, 512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1050368)))];
+    tensor<bool, []> matmul_1_transpose_x_1 = const()[name = tensor<string, []>("matmul_1_transpose_x_1"), val = tensor<bool, []>(false)];
+    tensor<bool, []> matmul_1_transpose_y_1 = const()[name = tensor<string, []>("matmul_1_transpose_y_1"), val = tensor<bool, []>(true)];
+    tensor<fp32, [512, 2998]> matmul_1 = matmul(transpose_x = matmul_1_transpose_x_1, transpose_y = matmul_1_transpose_y_1, x = cos_0, y = strided_input)[name = tensor<string, []>("matmul_1")];
+    tensor<bool, []> matmul_3_transpose_x_1 = const()[name = tensor<string, []>("matmul_3_transpose_x_1"), val = tensor<bool, []>(false)];
+    tensor<bool, []> matmul_3_transpose_y_1 = const()[name = tensor<string, []>("matmul_3_transpose_y_1"), val = tensor<bool, []>(true)];
+    tensor<fp32, [512, 2998]> matmul_3 = matmul(transpose_x = matmul_3_transpose_x_1, transpose_y = matmul_3_transpose_y_1, x = sin_0, y = strided_input)[name = tensor<string, []>("matmul_3")];
+    tensor<fp32, []> mul_1_y_0 = const()[name = tensor<string, []>("mul_1_y_0"), val = tensor<fp32, []>(-0x1p+0)];
+    tensor<fp32, [512, 2998]> mul_1 = mul(x = matmul_3, y = mul_1_y_0)[name = tensor<string, []>("mul_1")];
+    tensor<int32, [2]> transpose_3_perm_0 = const()[name = tensor<string, []>("transpose_3_perm_0"), val = tensor<int32, [2]>([-1, 0])];
+    tensor<int32, [2]> transpose_4_perm_0 = const()[name = tensor<string, []>("transpose_4_perm_0"), val = tensor<int32, [2]>([-1, 0])];
+    tensor<int32, [257]> range_1d_2 = const()[name = tensor<string, []>("range_1d_2"), val = tensor<int32, [257]>([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256])];
+    tensor<int32, []> gather_0_axis_0 = const()[name = tensor<string, []>("gather_0_axis_0"), val = tensor<int32, []>(-1)];
+    tensor<int32, []> gather_0_batch_dims_0 = const()[name = tensor<string, []>("gather_0_batch_dims_0"), val = tensor<int32, []>(0)];
+    tensor<fp32, [2998, 512]> transpose_3 = transpose(perm = transpose_3_perm_0, x = matmul_1)[name = tensor<string, []>("transpose_6")];
+    tensor<fp32, [2998, 257]> gather_0 = gather(axis = gather_0_axis_0, batch_dims = gather_0_batch_dims_0, indices = range_1d_2, x = transpose_3)[name = tensor<string, []>("gather_0")];
+    tensor<int32, []> gather_1_axis_0 = const()[name = tensor<string, []>("gather_1_axis_0"), val = tensor<int32, []>(-1)];
+    tensor<int32, []> gather_1_batch_dims_0 = const()[name = tensor<string, []>("gather_1_batch_dims_0"), val = tensor<int32, []>(0)];
+    tensor<fp32, [2998, 512]> transpose_4 = transpose(perm = transpose_4_perm_0, x = mul_1)[name = tensor<string, []>("transpose_5")];
+    tensor<fp32, [2998, 257]> gather_1 = gather(axis = gather_1_axis_0, batch_dims = gather_1_batch_dims_0, indices = range_1d_2, x = transpose_4)[name = tensor<string, []>("gather_1")];
+    tensor<fp32, [2998, 257]> square_0 = square(x = gather_0)[name = tensor<string, []>("square_0")];
+    tensor<fp32, [2998, 257]> square_1 = square(x = gather_1)[name = tensor<string, []>("square_1")];
+    tensor<fp32, [2998, 257]> add_1 = add(x = square_0, y = square_1)[name = tensor<string, []>("add_1")];
+    tensor<fp32, [2998, 257]> spectrum = identity(x = add_1)[name = tensor<string, []>("spectrum")];
+    tensor<fp32, [80, 257]> mel_energies_3 = const()[name = tensor<string, []>("mel_energies_3"), val = tensor<fp32, [80, 257]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2099008)))];
+    tensor<fp32, [80]> mel_energies_bias_0 = const()[name = tensor<string, []>("mel_energies_bias_0"), val = tensor<fp32, [80]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2181312)))];
+    tensor<fp32, [2998, 80]> mel_energies = linear(bias = mel_energies_bias_0, weight = mel_energies_3, x = spectrum)[name = tensor<string, []>("mel_energies")];
+    tensor<fp32, []> const_10 = const()[name = tensor<string, []>("const_10"), val = tensor<fp32, []>(0x1p-23)];
+    tensor<fp32, [2998, 80]> var_186 = maximum(x = mel_energies, y = const_10)[name = tensor<string, []>("op_186")];
+    tensor<fp32, []> filter_banks_epsilon_0 = const()[name = tensor<string, []>("filter_banks_epsilon_0"), val = tensor<fp32, []>(0x1p-149)];
+    tensor<fp32, [2998, 80]> filter_banks = log(epsilon = filter_banks_epsilon_0, x = var_186)[name = tensor<string, []>("filter_banks")];
+    tensor<int32, [1]> var_192_axes_0 = const()[name = tensor<string, []>("op_192_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<bool, []> var_192_keep_dims_0 = const()[name = tensor<string, []>("op_192_keep_dims_0"), val = tensor<bool, []>(true)];
+    tensor<fp32, [1, 80]> var_192 = reduce_mean(axes = var_192_axes_0, keep_dims = var_192_keep_dims_0, x = filter_banks)[name = tensor<string, []>("op_192")];
+    tensor<fp32, [2998, 80]> var_194 = sub(x = filter_banks, y = var_192)[name = tensor<string, []>("op_194")];
+    tensor<int32, [1]> obj_axes_0 = const()[name = tensor<string, []>("obj_axes_0"), val = tensor<int32, [1]>([0])];
+    tensor<fp32, [1, 2998, 80]> preprocessor_output_1_type_fp32 = expand_dims(axes = obj_axes_0, x = var_194)[name = tensor<string, []>("obj")];
+    tensor<string, []> cast_9_dtype_0 = const()[name = tensor<string, []>("cast_9_dtype_0"), val = tensor<string, []>("fp16")];
+    tensor<fp16, [1, 2998, 80]> preprocessor_output_1 = cast(dtype = cast_9_dtype_0, x = preprocessor_output_1_type_fp32)[name = tensor<string, []>("cast_10")];
+  } -> (preprocessor_output_1);
+}
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f2c284bd22f1f7ab76901c1c6e57f82d4ebbf057fa0b924aad057f124f77a89
+size 2181696
@@ -0,0 +1,7 @@
+Argmax proprietary and confidential. Under NDA.
+
+Copyright 2025 Argmax, Inc. All rights reserved.
+
+Unauthorized access, copying, use, distribution, and/or commercialization of this file, via any medium or means, is strictly prohibited.
+
+Please contact Argmax for licensing information at [email protected].
@@ -0,0 +1,6 @@
+# License
+
+Original model weights: https://huggingface.co/pyannote/segmentation-3.0/blob/main/LICENSE
+Argmax-optimized model assets (assets with the `.mlmodelc` extension): https://huggingface.co/argmaxinc/speakerkit-pro/blob/main/LICENSE_NOTICE.txt
+
+Please contact [email protected] for licensing SpeakerKit Pro assets.
@@ -0,0 +1,7 @@
+Argmax proprietary and confidential. Under NDA.
+
+Copyright 2025 Argmax, Inc. All rights reserved.
+
+Unauthorized access, copying, use, distribution, and/or commercialization of this file, via any medium or means, is strictly prohibited.
+
+Please contact Argmax for licensing information at [email protected].
@@ -0,0 +1,6 @@
+# License
+
+Original model weights: https://huggingface.co/pyannote/segmentation-3.0/blob/main/LICENSE
+Argmax-optimized model assets (assets with the `.mlmodelc` extension): https://huggingface.co/argmaxinc/speakerkit-pro/blob/main/LICENSE_NOTICE.txt
+
+Please contact [email protected] for licensing SpeakerKit Pro assets.
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f3593627d0e4a99c4537655e8339aa5f786a175f913194781af7c6ef3b969f7
+size 243
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d92ffe80d66daa38293970d33fef64924b89b3f8d8ee71606e1a1e03e19d200
+size 519
@@ -0,0 +1,144 @@
+[
+  {
+    "metadataOutputVersion" : "3.0",
+    "storagePrecision" : "Float32",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 589 × 3)",
+        "shortDescription" : "",
+        "shape" : "[21, 589, 3]",
+        "name" : "speaker_probs",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 589 × 3)",
+        "shortDescription" : "",
+        "shape" : "[21, 589, 3]",
+        "name" : "speaker_ids",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 3)",
+        "shortDescription" : "",
+        "shape" : "[21, 3]",
+        "name" : "speaker_activity",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 589)",
+        "shortDescription" : "",
+        "shape" : "[21, 589]",
+        "name" : "overlapped_speaker_activity",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1767)",
+        "shortDescription" : "",
+        "shape" : "[1767]",
+        "name" : "voice_activity",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 1 × 160000)",
+        "shortDescription" : "",
+        "shape" : "[21, 1, 160000]",
+        "name" : "sliding_window_waveform",
+        "type" : "MultiArray"
+      }
+    ],
+    "modelParameters" : [
+
+    ],
+    "specificationVersion" : 7,
+    "mlProgramOperationTypeHistogram" : {
+      "Transpose" : 2,
+      "Ios16.maxPool" : 3,
+      "Ios16.exp" : 1,
+      "Ios16.softmax" : 1,
+      "SlidingWindows" : 1,
+      "Ios16.linear" : 5,
+      "Ios16.add" : 40,
+      "Ios16.realDiv" : 1,
+      "Ios16.reduceMax" : 1,
+      "Ios16.reduceSum" : 2,
+      "Ios16.reduceArgmax" : 1,
+      "Ios16.greater" : 1,
+      "Ios16.log" : 1,
+      "ExpandDims" : 1,
+      "Ios16.instanceNorm" : 4,
+      "Ios16.sub" : 1,
+      "Ios16.cast" : 9,
+      "Ios16.conv" : 3,
+      "Ios16.lstm" : 4,
+      "OneHot" : 1,
+      "SliceByIndex" : 61,
+      "Ios16.abs" : 1,
+      "Ios16.scatter" : 42,
+      "Ios16.mul" : 1,
+      "Ios16.leakyRelu" : 5
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "stateSchema" : [
+
+    ],
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.version" : "8.2",
+      "com.github.apple.coremltools.source" : "torch==2.6.0"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 480000)",
+        "shortDescription" : "",
+        "shape" : "[480000]",
+        "name" : "waveform",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 7)",
+        "shortDescription" : "",
+        "shape" : "[7]",
+        "name" : "input_1",
+        "type" : "MultiArray"
+      }
+    ],
+    "generatedClassName" : "SpeakerSegmenter",
+    "method" : "predict"
+  }
+]
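
Per this schema, the segmenter takes a full 30 s waveform (480000 samples at 16 kHz) plus a 7-element `input_1` vector and windows internally: the [21, 1, 160000] `sliding_window_waveform` output is consistent with 21 overlapping 10 s windows at a 1 s hop, and `voice_activity`'s 1767 frames equal 3 × 589, i.e. the per-window frame rate carried across the whole 30 s. A usage sketch under those shapes — the semantics of `input_1` are not documented in this diff, so a zero vector stands in:

```python
# Sketch: drive the W32A32 segmenter using the input/output names and shapes
# from the metadata.json above. The local path and the zeroed input_1 vector
# are assumptions, not SpeakerKit's documented usage.
import numpy as np
import coremltools as ct

seg = ct.models.CompiledMLModel(
    "speaker_segmenter/pyannote-v3-pro/W32A32/SpeakerSegmenter.mlmodelc"
)
audio = np.zeros(480000, dtype=np.float16)   # 30 s of 16 kHz audio
params = np.zeros(7, dtype=np.float16)       # placeholder for input_1
out = seg.predict({"waveform": audio, "input_1": params})
probs = out["speaker_probs"]                 # (21 windows, 589 frames, 3 speakers)
vad = out["voice_activity"]                  # (1767,) frame-level speech activity
```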
The diff for this file is too large to render; see the raw diff.
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e76cb6e08ccbc6a007135fca00179f5c72ed6b0878e1584b129614388ee6909b
+size 5990900
@@ -0,0 +1,7 @@
+Argmax proprietary and confidential. Under NDA.
+
+Copyright 2025 Argmax, Inc. All rights reserved.
+
+Unauthorized access, copying, use, distribution, and/or commercialization of this file, via any medium or means, is strictly prohibited.
+
+Please contact Argmax for licensing information at [email protected].
@@ -0,0 +1,6 @@
+# License
+
+Original model weights: https://huggingface.co/pyannote/segmentation-3.0/blob/main/LICENSE
+Argmax-optimized model assets (assets with the `.mlmodelc` extension): https://huggingface.co/argmaxinc/speakerkit-pro/blob/main/LICENSE_NOTICE.txt
+
+Please contact [email protected] for licensing SpeakerKit Pro assets.
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25923d134e4f141b7e5284d06144f7b5961eb43b3a7027495bb54e322706570b
+size 243
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d92ffe80d66daa38293970d33fef64924b89b3f8d8ee71606e1a1e03e19d200
+size 519
@@ -0,0 +1,145 @@
+[
+  {
+    "metadataOutputVersion" : "3.0",
+    "storagePrecision" : "Mixed (Float16, Float32, Palettized (8 bits))",
+    "outputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 589 × 3)",
+        "shortDescription" : "",
+        "shape" : "[21, 589, 3]",
+        "name" : "speaker_probs",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 589 × 3)",
+        "shortDescription" : "",
+        "shape" : "[21, 589, 3]",
+        "name" : "speaker_ids",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 3)",
+        "shortDescription" : "",
+        "shape" : "[21, 3]",
+        "name" : "speaker_activity",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 589)",
+        "shortDescription" : "",
+        "shape" : "[21, 589]",
+        "name" : "overlapped_speaker_activity",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 1767)",
+        "shortDescription" : "",
+        "shape" : "[1767]",
+        "name" : "voice_activity",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 21 × 1 × 160000)",
+        "shortDescription" : "",
+        "shape" : "[21, 1, 160000]",
+        "name" : "sliding_window_waveform",
+        "type" : "MultiArray"
+      }
+    ],
+    "modelParameters" : [
+
+    ],
+    "specificationVersion" : 7,
+    "mlProgramOperationTypeHistogram" : {
+      "Transpose" : 2,
+      "Ios16.maxPool" : 3,
+      "Ios16.exp" : 1,
+      "Ios16.softmax" : 1,
+      "SlidingWindows" : 1,
+      "Ios16.linear" : 5,
+      "Ios16.add" : 40,
+      "Ios16.realDiv" : 1,
+      "Ios16.reduceMax" : 1,
+      "Ios16.reduceSum" : 2,
+      "Ios16.reduceArgmax" : 1,
+      "Ios16.greater" : 1,
+      "Ios16.log" : 1,
+      "ExpandDims" : 1,
+      "Ios16.instanceNorm" : 4,
+      "Ios16.sub" : 1,
+      "Ios16.cast" : 4,
+      "Ios16.conv" : 3,
+      "Ios16.constexprLutToDense" : 22,
+      "OneHot" : 1,
+      "Ios16.abs" : 1,
+      "Ios16.lstm" : 4,
+      "SliceByIndex" : 61,
+      "Ios16.scatter" : 42,
+      "Ios16.mul" : 1,
+      "Ios16.leakyRelu" : 5
+    },
+    "computePrecision" : "Mixed (Float16, Float32, Int32)",
+    "isUpdatable" : "0",
+    "stateSchema" : [
+
+    ],
+    "availability" : {
+      "macOS" : "13.0",
+      "tvOS" : "16.0",
+      "visionOS" : "1.0",
+      "watchOS" : "9.0",
+      "iOS" : "16.0",
+      "macCatalyst" : "16.0"
+    },
+    "modelType" : {
+      "name" : "MLModelType_mlProgram"
+    },
+    "userDefinedMetadata" : {
+      "com.github.apple.coremltools.source_dialect" : "TorchScript",
+      "com.github.apple.coremltools.version" : "8.2",
+      "com.github.apple.coremltools.source" : "torch==2.6.0"
+    },
+    "inputSchema" : [
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 480000)",
+        "shortDescription" : "",
+        "shape" : "[480000]",
+        "name" : "waveform",
+        "type" : "MultiArray"
+      },
+      {
+        "hasShapeFlexibility" : "0",
+        "isOptional" : "0",
+        "dataType" : "Float16",
+        "formattedType" : "MultiArray (Float16 7)",
+        "shortDescription" : "",
+        "shape" : "[7]",
+        "name" : "input_1",
+        "type" : "MultiArray"
+      }
+    ],
+    "generatedClassName" : "SpeakerSegmenter_8_bit",
+    "method" : "predict"
+  }
+]
The diff for this file is too large to render; see the raw diff.
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:18aa76153cdb04fc74b8b3ab438d96d0f297aba084f4ebc7ea2b7dcc611c1838
+size 1537882