optim flatten().shape[0] is numel (#10935)

2026-06-24 02:14:17 +00:00 · 2025-06-23 13:11:19 -04:00 · 2025-06-23 13:11:19 -04:00 · 785b4ea8ac
commit 785b4ea8ac
parent ac39f27ae6
1 changed file with 1 addition and 1 deletion
--- a/tinygrad/nn/optim.py
+++ b/tinygrad/nn/optim.py
@@ -21,7 +21,7 @@ class Optimizer:
    # store lr in at least float32 precision
    self.lr = Tensor(lr if getenv("CONST_LR") else [lr], requires_grad=False, device=self.device,
                     dtype=least_upper_dtype(dtypes.default_float, dtypes.float32))
-    if self.fused: self.pos_params = list(itertools.accumulate(self.params, lambda x,y: x+y.flatten().shape[0], initial=0))
+    if self.fused: self.pos_params = list(itertools.accumulate(self.params, lambda x,y: x+y.numel(), initial=0))

  def _new_optim_param(self) -> list[Tensor]:
    param_dtype = getenv("OPTIM_DTYPE", "float32")