Refactor stack method in tensor for performance

CodeWithKyrian · CodeWithKyrian · commit 32d8cfd04d6b · 2024-05-01T10:17:20.000+01:00
diff --git a/src/FeatureExtractors/ImageFeatureExtractor.php b/src/FeatureExtractors/ImageFeatureExtractor.php
@@ -201,9 +201,7 @@ public function padImage(
         int       $constantValues = 0
     ): array
     {
-        $imageHeight = $imgShape[0];
-        $imageWidth = $imgShape[1];
-        $imageChannels = $imgShape[2];
+        [$imageHeight, $imageWidth, $imageChannels] = $imgShape;
 
         if (is_array($padSize)) {
             $paddedImageWidth = $padSize['width'];
@@ -459,7 +457,6 @@ public function preprocess(
 
         $imgShape = [$image->height(), $image->width(), $image->channels];
 
-
         if ($this->doRescale) {
             $this->rescale($pixelData);
         }
@@ -529,21 +526,12 @@ public function __invoke(Image|array $images, ...$args): array
             $imageData[] = $this->preprocess($image);
         }
 
-        // Stack pixel values
-        $pixelValues = [];
-        foreach ($imageData as $data) {
-            $pixelValues[] = $data['pixel_values'];
-        }
+        $pixelValues = array_column($imageData, 'pixel_values');
+        $originalSizes = array_column($imageData, 'original_size');
+        $reshapedInputSizes = array_column($imageData, 'reshaped_input_size');
 
         $stackedPixelValues = Tensor::stack($pixelValues, 0);
 
-        // Prepare metadata
-        $originalSizes = [];
-        $reshapedInputSizes = [];
-        foreach ($imageData as $data) {
-            $originalSizes[] = $data['original_size'];
-            $reshapedInputSizes[] = $data['reshaped_input_size'];
-        }
         return [
             'pixel_values' => $stackedPixelValues,
             'original_sizes' => $originalSizes,
diff --git a/src/Generation/Samplers/Sampler.php b/src/Generation/Samplers/Sampler.php
@@ -57,14 +57,11 @@ public function getLogits(Tensor $logits, int $index): Tensor
 //            $logs = array_slice($logs, $startIndex, $startIndex + $vocabSize);
 //        }
 
-        $start = array_fill(0, $logits->ndim() - 2, 0);
-        $size = array_fill(0, $logits->ndim() - 2, 1);
+        $start = array_fill(0, $logits->ndim(), 0);
+        $size = array_fill(0, $logits->ndim(), 1);
 
-        $start[] = $index;
-        $size[] = 1;
-
-        $start[] = -$vocabSize;
-        $size[] = $vocabSize;
+        array_splice($start, -2, replacement: [$index, 0]);
+        array_splice($size, -2, replacement: [1, $vocabSize]);
 
         $logs = $logits->newSlice($start, $size);
 
diff --git a/src/Models/Pretrained/PretrainedModel.php b/src/Models/Pretrained/PretrainedModel.php
@@ -625,7 +625,7 @@ public function generate(
                 // In most cases, this will be [batch_size, 1, vocab_size]
                 // So, we select the last token's logits:
                 // (equivalent to `logits = outputs.logits[:, -1, :]`)
-                $logits = $output['logits']-lice(null, -1, null);
+                $logits = $output['logits']->slice(null, -1, null);
 
                 // Apply logits processor
                 $logitsProcessor($beam['output_token_ids'], $logits);
diff --git a/src/Pipelines/ImageClassificationPipeline.php b/src/Pipelines/ImageClassificationPipeline.php
@@ -62,7 +62,6 @@ public function __invoke(array|string $inputs, ...$args): array
 
         ['pixel_values' => $pixelValues] = ($this->processor)($preparedImages);
 
-
         /** @var SequenceClassifierOutput $output */
         $output = $this->model->__invoke(['pixel_values' => $pixelValues]);
 
@@ -86,6 +85,7 @@ public function __invoke(array|string $inputs, ...$args): array
                 $toReturn[] = $values;
             }
         }
+
         if ($isBatched || $topK === 1) {
             return $toReturn;
         } else {
diff --git a/src/Pipelines/ZeroShotImageClassificationPipeline.php b/src/Pipelines/ZeroShotImageClassificationPipeline.php
@@ -51,7 +51,7 @@ public function __invoke(array|string $inputs, ...$args): array
         $output = $this->model->__invoke(array_merge($textInputs, ['pixel_values' => $pixelValues]));
 
         $activationFn = $this->model->config['model_type'] === 'siglip' ?
-            fn(Tensor $batch) => $batch->sigmoid()->toArray() :
+            fn(Tensor $batch) => $batch->sigmoid():
             fn(Tensor $batch) => $batch->softmax();
 
         // Compare each image with each candidate label
diff --git a/src/Utils/Tensor.php b/src/Utils/Tensor.php
@@ -459,9 +459,11 @@ public static function zerosLike(Tensor $other): static
      */
     public static function stack(array $tensors, int $axis = 0): Tensor
     {
-        // TODO: Perform validation of shapes
-        // NOTE: stack expects each tensor to be equal size
-        return self::cat(array_map(fn($t) => $t->unsqueeze($axis), $tensors), $axis);
+        $mo = self::mo();
+
+        $stacked = $mo->la()->stack($tensors, $axis);
+
+        return new Tensor($stacked->buffer(), $stacked->dtype(), $stacked->shape(), $stacked->offset());
     }
 
     /**
@@ -473,58 +475,13 @@ public static function stack(array $tensors, int $axis = 0): Tensor
      * @return Tensor The concatenated tensor.
      * @throws Exception
      */
-    public static function cat(array $tensors, int $axis = 0): Tensor
+    public static function concat(array $tensors, int $axis = 0): Tensor
     {
-        $axis = self::safeIndex($axis, $tensors[0]->ndim());
-
-        // TODO: Perform validation of shapes
-
-        $resultShape = $tensors[0]->shape();
-        $resultOffset = $tensors[0]->offset();
-        $resultType = $tensors[0]->dtype();
-        $resultShape[$axis] = array_reduce($tensors, fn($carry, $tensor) => $carry + $tensor->shape()[$axis], 0);
-
-        // Create a new array to store the accumulated values
-        $resultSize = array_product($resultShape);
-
-        $result = self::newBuffer($resultSize, $resultType);
-
-        // Create output tensor of same type as first
-
-        if ($axis === 0) {
-            // Handle special case for performance reasons
-
-            $offset = 0;
-            foreach ($tensors as $t) {
-                for ($i = 0; $i < $t->buffer->count(); $i++) {
-                    $result[$offset++] = $t->buffer()[$i];
-                }
-            }
-        } else {
-            $currentShape = 0;
-
-            foreach ($tensors as $tensor) {
-                for ($i = 0; $i < $tensor->buffer->count(); $i++) {
-                    $resultIndex = 0;
-
-                    for ($j = $tensor->ndim() - 1, $num = $i, $resultMultiplier = 1; $j >= 0; --$j) {
-                        $size = $tensor->shape()[$j];
-                        $index = $num % $size;
-                        if ($j === $axis) {
-                            $index += $currentShape;
-                        }
-                        $resultIndex += $index * $resultMultiplier;
-                        $resultMultiplier *= $resultShape[$j];
-                        $num = (int)floor($num / $size);
-                    }
-                    $result[$resultIndex] = $tensor->buffer()[$i];
-                }
+        $mo = self::mo();
 
-                $currentShape += $tensor->shape()[$axis];
-            }
-        }
+        $ndArray = $mo->la()->concat($tensors, $axis);
 
-        return new Tensor($result, $resultType, $resultShape, $resultOffset);
+        return new static($ndArray->buffer(), $ndArray->dtype(), $ndArray->shape(), $ndArray->offset());
     }
 
     /**
@@ -577,31 +534,16 @@ public function squeeze(?int $axis = null): static
      */
     public function unsqueeze(?int $axis = null): static
     {
-        return new Tensor(
-            $this->buffer(),
-            $this->dtype,
-            $this->calcUnsqueezeShape($this->shape(), $axis),
-            $this->offset
-        );
-    }
+        $shape = $this->shape();
 
-    /**
-     * Helper function to calculate new shape when performing an unsqueeze operation.
-     * @param array $shape The shape of the tensor.
-     * @param int $axis The axis to unsqueeze.
-     * @return array The new shape.
-     */
-    protected function calcUnsqueezeShape(array $shape, int $axis): array
-    {
-        // Dimension out of range (e.g., "expected to be in range of [-4, 3], but got 4")
-        // + 1 since we allow inserting at the end (i.e. $axis = -1)
         $axis = self::safeIndex($axis, count($shape) + 1);
 
         array_splice($shape, $axis, 0, 1);
 
-        return $shape;
+        return new Tensor($this->buffer(), $this->dtype, $shape, $this->offset);
     }
 
+
     /**
      * Add a tensor or scalar to this tensor. If it's a tensor, it must be the same shape, and it performs
      * an element-wise addition. If it's a scalar, it adds the scalar to every element in the tensor.

| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
| | | `@@ -62,7 +62,6 @@ public function __invoke(array\|string $inputs, ...$args): array` |
| `62` | `62` | |
| `63` | `63` | `['pixel_values' => $pixelValues] = ($this->processor)($preparedImages);` |
| `64` | `64` | |
| `65` | | `-` |
| `66` | `65` | `/** @var SequenceClassifierOutput $output */` |
| `67` | `66` | `$output = $this->model->__invoke(['pixel_values' => $pixelValues]);` |
| `68` | `67` | |
| | | `@@ -86,6 +85,7 @@ public function __invoke(array\|string $inputs, ...$args): array` |
| `86` | `85` | `$toReturn[] = $values;` |
| `87` | `86` | `}` |
| `88` | `87` | `}` |
| | `88` | `+` |
| `89` | `89` | `if ($isBatched \|\| $topK === 1) {` |
| `90` | `90` | `return $toReturn;` |
| `91` | `91` | `} else {` |