tracel-ai
diff --git a/burn-book/src/building-blocks/tensor.md b/burn-book/src/building-blocks/tensor.md
Lines changed: 35 additions & 34 deletions
diff --git a/crates/burn-autodiff/src/ops/bool_tensor.rs b/crates/burn-autodiff/src/ops/bool_tensor.rs
Lines changed: 2 additions & 2 deletions
diff --git a/crates/burn-autodiff/src/ops/int_tensor.rs b/crates/burn-autodiff/src/ops/int_tensor.rs
Lines changed: 2 additions & 2 deletions
diff --git a/crates/burn-autodiff/src/ops/tensor.rs b/crates/burn-autodiff/src/ops/tensor.rs
Lines changed: 6 additions & 4 deletions
diff --git a/crates/burn-autodiff/src/tests/mod.rs b/crates/burn-autodiff/src/tests/mod.rs
Lines changed: 2 additions & 2 deletions
diff --git a/crates/burn-autodiff/src/tests/repeat.rs b/crates/burn-autodiff/src/tests/repeat_dim.rs
rename from crates/burn-autodiff/src/tests/repeat.rs
rename to crates/burn-autodiff/src/tests/repeat_dim.rs
Lines changed: 2 additions & 2 deletions
diff --git a/crates/burn-candle/src/lib.rs b/crates/burn-candle/src/lib.rs
Lines changed: 1 addition & 1 deletion
diff --git a/crates/burn-core/src/nn/attention/mask.rs b/crates/burn-core/src/nn/attention/mask.rs
Lines changed: 1 addition & 1 deletion
diff --git a/crates/burn-core/src/nn/loss/cross_entropy.rs b/crates/burn-core/src/nn/loss/cross_entropy.rs
Lines changed: 3 additions & 3 deletions
diff --git a/crates/burn-core/src/nn/rope_encoding.rs b/crates/burn-core/src/nn/rope_encoding.rs
Lines changed: 2 additions & 2 deletions
@@ -131,40 +131,41 @@ for the sake of simplicity, we ignore type signatures. For more details, refer t
 
 Those operations are available for all tensor kinds: `Int`, `Float`, and `Bool`.
 
-| Burn                                  | PyTorch Equivalent                   |
-| ------------------------------------- | ------------------------------------ |
-| `Tensor::cat(tensors, dim)`           | `torch.cat(tensors, dim)`            |
-| `Tensor::empty(shape, device)`        | `torch.empty(shape, device=device)`  |
-| `Tensor::from_primitive(primitive)`   | N/A                                  |
-| `Tensor::stack(tensors, dim)`         | `torch.stack(tensors, dim)`          |
-| `tensor.all()`                        | `tensor.all()`                       |
-| `tensor.all_dim(dim)`                 | `tensor.all(dim)`                    |
-| `tensor.any()`                        | `tensor.any()`                       |
-| `tensor.any_dim(dim)`                 | `tensor.any(dim)`                    |
-| `tensor.chunk(num_chunks, dim)`       | `tensor.chunk(num_chunks, dim)`      |
-| `tensor.device()`                     | `tensor.device`                      |
-| `tensor.dims()`                       | `tensor.size()`                      |
-| `tensor.equal(other)`                 | `x == y`                             |
-| `tensor.expand(shape)`                | `tensor.expand(shape)`               |
-| `tensor.flatten(start_dim, end_dim)`  | `tensor.flatten(start_dim, end_dim)` |
-| `tensor.flip(axes)`                   | `tensor.flip(axes)`                  |
-| `tensor.into_data()`                  | N/A                                  |
-| `tensor.into_primitive()`             | N/A                                  |
-| `tensor.into_scalar()`                | `tensor.item()`                      |
-| `tensor.narrow(dim, start, length)`   | `tensor.narrow(dim, start, length)`  |
-| `tensor.not_equal(other)`             | `x != y`                             |
-| `tensor.permute(axes)`                | `tensor.permute(axes)`               |
-| `tensor.movedim(src, dst)`            | `tensor.movedim(src, dst)`           |
-| `tensor.repeat(2, 4)`                 | `tensor.repeat([1, 1, 4])`           |
-| `tensor.reshape(shape)`               | `tensor.view(shape)`                 |
-| `tensor.shape()`                      | `tensor.shape`                       |
-| `tensor.slice(ranges)`                | `tensor[(*ranges,)]`                 |
-| `tensor.slice_assign(ranges, values)` | `tensor[(*ranges,)] = values`        |
-| `tensor.squeeze(dim)`                 | `tensor.squeeze(dim)`                |
-| `tensor.to_data()`                    | N/A                                  |
-| `tensor.to_device(device)`            | `tensor.to(device)`                  |
-| `tensor.unsqueeze()`                  | `tensor.unsqueeze(0)`                |
-| `tensor.unsqueeze_dim(dim)`           | `tensor.unsqueeze(dim)`              |
+| Burn                                  | PyTorch Equivalent                                                       |
+| ------------------------------------- | ------------------------------------------------------------------------ |
+| `Tensor::cat(tensors, dim)`           | `torch.cat(tensors, dim)`                                                |
+| `Tensor::empty(shape, device)`        | `torch.empty(shape, device=device)`                                      |
+| `Tensor::from_primitive(primitive)`   | N/A                                                                      |
+| `Tensor::stack(tensors, dim)`         | `torch.stack(tensors, dim)`                                              |
+| `tensor.all()`                        | `tensor.all()`                                                           |
+| `tensor.all_dim(dim)`                 | `tensor.all(dim)`                                                        |
+| `tensor.any()`                        | `tensor.any()`                                                           |
+| `tensor.any_dim(dim)`                 | `tensor.any(dim)`                                                        |
+| `tensor.chunk(num_chunks, dim)`       | `tensor.chunk(num_chunks, dim)`                                          |
+| `tensor.device()`                     | `tensor.device`                                                          |
+| `tensor.dims()`                       | `tensor.size()`                                                          |
+| `tensor.equal(other)`                 | `x == y`                                                                 |
+| `tensor.expand(shape)`                | `tensor.expand(shape)`                                                   |
+| `tensor.flatten(start_dim, end_dim)`  | `tensor.flatten(start_dim, end_dim)`                                     |
+| `tensor.flip(axes)`                   | `tensor.flip(axes)`                                                      |
+| `tensor.into_data()`                  | N/A                                                                      |
+| `tensor.into_primitive()`             | N/A                                                                      |
+| `tensor.into_scalar()`                | `tensor.item()`                                                          |
+| `tensor.narrow(dim, start, length)`   | `tensor.narrow(dim, start, length)`                                      |
+| `tensor.not_equal(other)`             | `x != y`                                                                 |
+| `tensor.permute(axes)`                | `tensor.permute(axes)`                                                   |
+| `tensor.movedim(src, dst)`            | `tensor.movedim(src, dst)`                                               |
+| `tensor.repeat_dim(dim, times)`       | `tensor.repeat(*[times if i == dim else 1 for i in range(tensor.dim())])` |
+| `tensor.repeat(sizes)`                | `tensor.repeat(sizes)`                                                   |
+| `tensor.reshape(shape)`               | `tensor.view(shape)`                                                     |
+| `tensor.shape()`                      | `tensor.shape`                                                           |
+| `tensor.slice(ranges)`                | `tensor[(*ranges,)]`                                                     |
+| `tensor.slice_assign(ranges, values)` | `tensor[(*ranges,)] = values`                                            |
+| `tensor.squeeze(dim)`                 | `tensor.squeeze(dim)`                                                    |
+| `tensor.to_data()`                    | N/A                                                                      |
+| `tensor.to_device(device)`            | `tensor.to(device)`                                                      |
+| `tensor.unsqueeze()`                  | `tensor.unsqueeze(0)`                                                    |
+| `tensor.unsqueeze_dim(dim)`           | `tensor.unsqueeze(dim)`                                                  |
 
 ### Numeric Operations
 
 
@@ -132,11 +132,11 @@ impl<B: Backend, C: CheckpointStrategy> BoolTensorOps<Self> for Autodiff<B, C> {
         B::bool_expand(tensor, shape)
     }
 
-    fn bool_repeat<const D: usize>(
+    fn bool_repeat_dim<const D: usize>(
         tensor: BoolTensor<B, D>,
         dim: usize,
         times: usize,
     ) -> BoolTensor<B, D> {
-        B::bool_repeat(tensor, dim, times)
+        B::bool_repeat_dim(tensor, dim, times)
     }
 }
@@ -162,12 +162,12 @@ impl<B: Backend, C: CheckpointStrategy> IntTensorOps<Self> for Autodiff<B, C> {
         B::int_mean_dim(tensor, dim)
     }
 
-    fn int_repeat<const D: usize>(
+    fn int_repeat_dim<const D: usize>(
         tensor: IntTensor<B, D>,
         dim: usize,
         times: usize,
     ) -> IntTensor<B, D> {
-        B::int_repeat(tensor, dim, times)
+        B::int_repeat_dim(tensor, dim, times)
     }
 
     fn int_greater<const D: usize>(lhs: IntTensor<B, D>, rhs: IntTensor<B, D>) -> BoolTensor<B, D> {
 
@@ -2418,7 +2418,7 @@ impl<B: Backend, C: CheckpointStrategy> FloatTensorOps<Self> for Autodiff<B, C>
         B::float_argsort(tensor.primitive, dim, descending)
     }
 
-    fn float_repeat<const D: usize>(
+    fn float_repeat_dim<const D: usize>(
         tensor: FloatTensor<Self, D>,
         dim: usize,
         times: usize,
@@ -2437,7 +2437,7 @@ impl<B: Backend, C: CheckpointStrategy> FloatTensorOps<Self> for Autodiff<B, C>
         impl<B: Backend, const D: usize> RetroForward for RetroRepeat<B, D> {
             fn forward(&self, states: &mut BackwardStates, out_node: NodeID) {
                 let tensor = states.get_state::<B::FloatTensorPrimitive<D>>(&self.tensor_id);
-                let out = B::float_repeat(tensor, self.dim, self.times);
+                let out = B::float_repeat_dim(tensor, self.dim, self.times);
                 states.save(out_node, out)
             }
         }
@@ -2467,9 +2467,11 @@ impl<B: Backend, C: CheckpointStrategy> FloatTensorOps<Self> for Autodiff<B, C>
             .stateful()
         {
             OpsKind::Tracked(prep) => {
-                prep.finish(dim, B::float_repeat(tensor.primitive, dim, times))
+                prep.finish(dim, B::float_repeat_dim(tensor.primitive, dim, times))
+            }
+            OpsKind::UnTracked(prep) => {
+                prep.finish(B::float_repeat_dim(tensor.primitive, dim, times))
             }
-            OpsKind::UnTracked(prep) => prep.finish(B::float_repeat(tensor.primitive, dim, times)),
         }
     }
 
 
@@ -47,7 +47,7 @@ mod permute;
 mod pow;
 mod recip;
 mod relu;
-mod repeat;
+mod repeat_dim;
 mod reshape;
 mod select;
 mod sigmoid;
@@ -133,6 +133,6 @@ macro_rules! testgen_all {
         burn_autodiff::testgen_ad_sign!();
         burn_autodiff::testgen_ad_expand!();
         burn_autodiff::testgen_ad_sort!();
-        burn_autodiff::testgen_ad_repeat!();
+        burn_autodiff::testgen_ad_repeat_dim!();
     };
 }
@@ -1,4 +1,4 @@
-#[burn_tensor_testgen::testgen(ad_repeat)]
+#[burn_tensor_testgen::testgen(ad_repeat_dim)]
 mod tests {
     use super::*;
     use burn_tensor::{activation, TensorData};
@@ -12,7 +12,7 @@ mod tests {
         let tensor_1 = TestAutodiffTensor::<2>::from_data(data_1, &device).require_grad();
         let tensor_2 = TestAutodiffTensor::from_data(data_2, &device).require_grad();
 
-        let tensor_3 = tensor_2.clone().repeat(1, 3);
+        let tensor_3 = tensor_2.clone().repeat_dim(1, 3);
 
         let tensor_3 = tensor_1.matmul(tensor_3);
         let grads = tensor_3.backward();
 
@@ -94,7 +94,7 @@ mod tests {
     // burn_tensor::testgen_powf!();
 
     burn_tensor::testgen_random!();
-    burn_tensor::testgen_repeat!();
+    burn_tensor::testgen_repeat_dim!();
     burn_tensor::testgen_reshape!();
     burn_tensor::testgen_select!();
     burn_tensor::testgen_sin!();
 
@@ -19,7 +19,7 @@ pub fn generate_autoregressive_mask<B: Backend>(
         mask = mask.slice_assign([0..1, i..i + 1, i + 1..seq_length], values);
     }
 
-    mask = mask.repeat(0, batch_size);
+    mask = mask.repeat_dim(0, batch_size);
 
     mask.equal_elem(1_i64.elem::<i64>())
 }
 
@@ -152,7 +152,7 @@ impl<B: Backend> CrossEntropyLoss<B> {
                     * weights
                         .clone()
                         .reshape([1, nr_classes])
-                        .repeat(0, batch_size);
+                        .repeat_dim(0, batch_size);
                 let weights = weights.clone().gather(0, targets);
                 let tensor = Self::apply_mask_2d(tensor, mask);
                 tensor.sum().neg() / weights.sum()
@@ -224,7 +224,7 @@ impl<B: Backend> CrossEntropyLoss<B> {
     fn apply_mask_2d(mut tensor: Tensor<B, 2>, mask: Option<Tensor<B, 1, Bool>>) -> Tensor<B, 2> {
         if let Some(mask) = mask {
             let [batch_size, nr_classes] = tensor.dims();
-            tensor = tensor.mask_fill(mask.reshape([batch_size, 1]).repeat(1, nr_classes), 0);
+            tensor = tensor.mask_fill(mask.reshape([batch_size, 1]).repeat_dim(1, nr_classes), 0);
         }
 
         tensor
@@ -312,7 +312,7 @@ mod tests {
             * targets_logits
             * Tensor::<TestBackend, 1>::from_floats(weights.as_slice(), &device)
                 .unsqueeze()
-                .repeat(0, 4);
+                .repeat_dim(0, 4);
         let loss_2 = loss_2.sum().neg() / (1. + 2. + 3. + 5.);
         loss_1.into_data().assert_approx_eq(&loss_2.into_data(), 3);
     }
 
@@ -58,7 +58,7 @@ impl RotaryEncodingConfig {
                 .float()
                 .unsqueeze()
                 .transpose()
-                .repeat(1, self.d_model / 2)
+                .repeat_dim(1, self.d_model / 2)
                 * theta_i.unsqueeze();
 
         // Convert frequency values to complex numbers (polar form)
@@ -71,7 +71,7 @@ impl RotaryEncodingConfig {
             .reshape([self.max_sequence_length, 2, self.d_model / 2])
             .transpose()
             .unsqueeze_dim::<4>(2)
-            .repeat(2, 2)
+            .repeat_dim(2, 2)
             .reshape([self.max_sequence_length, self.d_model, 2]);
 
         RotaryEncoding {
Original file line number	Diff line number	Diff line change
`@@ -132,11 +132,11 @@ impl<B: Backend, C: CheckpointStrategy> BoolTensorOps<Self> for Autodiff<B, C> {`
`132`	`132`	`B::bool_expand(tensor, shape)`
`133`	`133`	`}`
`134`	`134`
`135`		`- fn bool_repeat<const D: usize>(`
	`135`	`+ fn bool_repeat_dim<const D: usize>(`
`136`	`136`	`tensor: BoolTensor<B, D>,`
`137`	`137`	`dim: usize,`
`138`	`138`	`times: usize,`
`139`	`139`	`) -> BoolTensor<B, D> {`
`140`		`- B::bool_repeat(tensor, dim, times)`
	`140`	`+ B::bool_repeat_dim(tensor, dim, times)`
`141`	`141`	`}`
`142`	`142`	`}`
Original file line number	Diff line number	Diff line change
`@@ -162,12 +162,12 @@ impl<B: Backend, C: CheckpointStrategy> IntTensorOps<Self> for Autodiff<B, C> {`
`162`	`162`	`B::int_mean_dim(tensor, dim)`
`163`	`163`	`}`
`164`	`164`
`165`		`- fn int_repeat<const D: usize>(`
	`165`	`+ fn int_repeat_dim<const D: usize>(`
`166`	`166`	`tensor: IntTensor<B, D>,`
`167`	`167`	`dim: usize,`
`168`	`168`	`times: usize,`
`169`	`169`	`) -> IntTensor<B, D> {`
`170`		`- B::int_repeat(tensor, dim, times)`
	`170`	`+ B::int_repeat_dim(tensor, dim, times)`
`171`	`171`	`}`
`172`	`172`
`173`	`173`	`fn int_greater<const D: usize>(lhs: IntTensor<B, D>, rhs: IntTensor<B, D>) -> BoolTensor<B, D> {`
Original file line number	Diff line number	Diff line change
`@@ -2418,7 +2418,7 @@ impl<B: Backend, C: CheckpointStrategy> FloatTensorOps<Self> for Autodiff<B, C>`
`2418`	`2418`	`B::float_argsort(tensor.primitive, dim, descending)`
`2419`	`2419`	`}`
`2420`	`2420`
`2421`		`- fn float_repeat<const D: usize>(`
	`2421`	`+ fn float_repeat_dim<const D: usize>(`
`2422`	`2422`	`tensor: FloatTensor<Self, D>,`
`2423`	`2423`	`dim: usize,`
`2424`	`2424`	`times: usize,`
`@@ -2437,7 +2437,7 @@ impl<B: Backend, C: CheckpointStrategy> FloatTensorOps<Self> for Autodiff<B, C>`
`2437`	`2437`	`impl<B: Backend, const D: usize> RetroForward for RetroRepeat<B, D> {`
`2438`	`2438`	`fn forward(&self, states: &mut BackwardStates, out_node: NodeID) {`
`2439`	`2439`	`let tensor = states.get_state::<B::FloatTensorPrimitive<D>>(&self.tensor_id);`
`2440`		`- let out = B::float_repeat(tensor, self.dim, self.times);`
	`2440`	`+ let out = B::float_repeat_dim(tensor, self.dim, self.times);`
`2441`	`2441`	`states.save(out_node, out)`
`2442`	`2442`	`}`
`2443`	`2443`	`}`
`@@ -2467,9 +2467,11 @@ impl<B: Backend, C: CheckpointStrategy> FloatTensorOps<Self> for Autodiff<B, C>`
`2467`	`2467`	`.stateful()`
`2468`	`2468`	`{`
`2469`	`2469`	`OpsKind::Tracked(prep) => {`
`2470`		`- prep.finish(dim, B::float_repeat(tensor.primitive, dim, times))`
	`2470`	`+ prep.finish(dim, B::float_repeat_dim(tensor.primitive, dim, times))`
	`2471`	`+ }`
	`2472`	`+ OpsKind::UnTracked(prep) => {`
	`2473`	`+ prep.finish(B::float_repeat_dim(tensor.primitive, dim, times))`
`2471`	`2474`	`}`
`2472`		`- OpsKind::UnTracked(prep) => prep.finish(B::float_repeat(tensor.primitive, dim, times)),`
`2473`	`2475`	`}`
`2474`	`2476`	`}`
`2475`	`2477`
Original file line number	Diff line number	Diff line change
`@@ -19,7 +19,7 @@ pub fn generate_autoregressive_mask<B: Backend>(`
`19`	`19`	`mask = mask.slice_assign([0..1, i..i + 1, i + 1..seq_length], values);`
`20`	`20`	`}`
`21`	`21`
`22`		`- mask = mask.repeat(0, batch_size);`
	`22`	`+ mask = mask.repeat_dim(0, batch_size);`
`23`	`23`
`24`	`24`	`mask.equal_elem(1_i64.elem::<i64>())`
`25`	`25`	`}`