Fix TensorAlloc copy that was copying the ptr

Skeleton TensorGpu that initializes
Added TensorStatic and Alloc to lib.zig
2026-05-27 21:15:58 +02:00 · 2026-05-26 23:34:53 +02:00 · 2026-05-26 20:06:36 +02:00 · 2026-05-26 20:01:04 +02:00 · 2026-05-25 22:52:27 +02:00 · 2026-05-25 18:18:35 +02:00
20 changed files with 4423 additions and 1224 deletions
--- a/.gitea/workflows/deploy.yml
+++ b/.gitea/workflows/deploy.yml
@ -1,34 +0,0 @@
-name: Deploy MkDocs to Garage
-on:
-  push:
-    branches:
-      - main  # Adjust to your branch name
-
-jobs:
-  build-and-deploy:
-    runs-on: ubuntu-latest
-    steps:
-      - name: Checkout
-        uses: actions/checkout@v4
-
-      - name: Set up Python
-        uses: actions/setup-python@v4
-        with:
-          python-version: '3.x'
-
-      - name: Install dependencies
-        run: pip install mkdocs-material
-
-      - name: Build
-        run: mkdocs build
-
-      - name: Sync to Garage S3
-        uses: https://github.com/jakejarvis/s3-sync-action@master
-        with:
-          args: --endpoint-url https://s3.garage.bouvais.lu --acl public-read --delete
-        env:
-          AWS_S3_BUCKET: 'zig-dimal.bouvais.lu'
-          AWS_ACCESS_KEY_ID: ${{ secrets.GARAGE_ACCESS_KEY }}
-          AWS_SECRET_ACCESS_KEY: ${{ secrets.GARAGE_SECRET_KEY }}
-          AWS_REGION: 'garage' 
-          SOURCE_DIR: 'site' # MkDocs defaults to 'site' folder for output
--- a/.gitignore
+++ b/.gitignore
@ -1,2 +1,4 @@
 zig-out
 .zig-cache
+mkdocs.yaml
+zig-pkg
--- a/build.zig
+++ b/build.zig
@ -2,22 +2,29 @@ const std = @import("std");

 pub fn build(b: *std.Build) void {
    const target = b.standardTargetOptions(.{});
-    const optimize = b.standardOptimizeOption(.{ .preferred_optimize_mode = .ReleaseFast });
+    const optimize = b.standardOptimizeOption(.{});
+
+    const zig_wgpu = b.dependency("zig_wgpu", .{
+        .target = target,
+        .optimize = optimize,
+    });

    // 1. Define the module so other projects can import it
-    _ = b.addModule("dimal", .{
-        .root_source_file = b.path("src/main.zig"),
+    const mod = b.addModule("dimal", .{
+        .root_source_file = b.path("src/lib.zig"),
    });
+    mod.addImport("gpu", zig_wgpu.module("zig-wgpu"));

    const exe_tests = b.addTest(.{
        .root_module = b.createModule(.{
-            .root_source_file = b.path("src/main.zig"),
+            .root_source_file = b.path("src/test.zig"),
            .target = target,
            .optimize = optimize,
        }),
        .test_runner = .{ .path = b.path("test_runner.zig"), .mode = .simple },
    });

+    exe_tests.root_module.addImport("gpu", zig_wgpu.module("zig-wgpu"));
    const run_exe_tests = b.addRunArtifact(exe_tests);
    const test_step = b.step("test", "Run tests");
    test_step.dependOn(&run_exe_tests.step);
@ -30,6 +37,7 @@ pub fn build(b: *std.Build) void {
            .imports = &.{},
        }),
    });
+    bench_exe.root_module.addImport("gpu", zig_wgpu.module("zig-wgpu"));

    b.installArtifact(bench_exe);

--- a/build.zig.zon
+++ b/build.zig.zon
@ -1,9 +1,14 @@
 .{
    .name = .dimal,
-    .version = "0.1.0",
+    .version = "0.3.0",
    .fingerprint = 0x9453b1ff1e52d858,
    .minimum_zig_version = "0.16.0",
-    .dependencies = .{},
+    .dependencies = .{
+        .zig_wgpu = .{
+            .url = "git+https://git.bouvais.lu/adrien/zig-wgpu?ref=0.2.2#5f8da0940d77c40eacd39c268d09acbeaea0b2a5",
+            .hash = "zig_wgpu-0.2.0-xsLAy2-s0QPNwR2QNd8ZX2kWiVfV5oB92N3ga1V1Uwpu",
+        },
+    },
    .paths = .{
        "build.zig",
        "build.zig.zon",
--- a/release.md
+++ b/release.md
@ -1,11 +0,0 @@
-  Changed Quantity to Tensor that can use any shape and is a single @Vector.
-   Point being to add WebGPU easily from this.
-   Scalr suffer in performance tho, I will work on that
-
-Maybe I can do a jupiter like web interface with cells to make Dim analysis
-I could:
-  - Use cells with a toy language
-  - A nice debugger to display current variables with dimensions, type and value
-  - Realtime error (I try to compile at change, display error on the cell)
-  - Integrate a small graphic API that use Raylib canvas
-  - COuld generate template at comptime =o
--- a/docs/index.md
+++ b/docs/index.md
@ -1,253 +0,0 @@
-# dimal — Dimensional Analysis for Zig
-
-A dimensional analysis library for Zig with a unified `Tensor` API for scalars, vectors, matrices, and higher-dimensional data. All dimension and unit tracking happens at compile time—zero runtime overhead—and all operations use SIMD intrinsics.
-
-If you try to add meters to seconds, it won't compile. That's the point.
-
-> **Source:** [git.bouvais.lu/adrien/zig-dimal](https://git.bouvais.lu/adrien/zig-dimal)  
-> **Minimum Zig version:** `0.16.0`
-
---
-
-## Background
-
-Started because I needed `i128` positions for a space simulation to avoid floating-point precision loss far from the origin. Grew into a type system for tracking physical dimensions at compile time. It's been useful enough to share.
-
- **Compile-time dimension checking** — catch unit mismatches before runtime.
- **Unified `Tensor` API** — same interface for scalars, vectors, matrices, and higher-rank tensors.
- **SIMD operations** — vector and matrix code automatically uses SIMD instructions.
- **Zero runtime cost** — all dimension and scale tracking is erased at compile time.
- **Supports `i128`** — useful for high-precision fixed-point integer math.
-
---
-
-## Features
-
- **Compile-time dimension checking** — all physical-unit tracking happens at compile time.
- **Automatic unit conversion** — use `.to()` to convert between compatible units (e.g. `km/h` → `m/s`). Scale factors are resolved at comptime.
- **Unified `Tensor` API** — one type for scalars `{1}`, vectors `{N}`, matrices `{M, N}`, and higher-rank tensors.
- **SIMD operations** — vector and matrix code compiles to SIMD instructions automatically.
- **Tensor contraction** — `.contract(other, axis_a, axis_b)` for dot products, matrix multiplication, and general tensor contractions.
- **Full SI prefix support** — `pico` through `peta`, plus Imperial units and time scales.
- **Physical constants** — Planck, Boltzmann, speed of light, gravitational constant, etc.
- **Pre-built quantities** — `Velocity`, `Acceleration`, `Force`, `Energy`, `Pressure`, `Charge`, and more.
- **Basic vector operations** — cross product, length/magnitude, element-wise arithmetic.
- **Formatting** — values print with units: `9.81m.s⁻²`, `0.172km`.
-
-### Current Limitations
-
- GPU support not implemented.
- Performance on small tensors is limited by Zig's vector width.
-
---
-
-## The 7 SI Base Dimensions
-
-| Symbol | Dimension            | SI Unit |
-|--------|----------------------|---------|
-| `L`    | Length               | `m`     |
-| `M`    | Mass                 | `g`     |
-| `T`    | Time                 | `s`     |
-| `I`    | Electric Current     | `A`     |
-| `Tr`   | Temperature          | `K`     |
-| `N`    | Amount of Substance  | `mol`   |
-| `J`    | Luminous Intensity   | `cd`    |
-
---
-
-## Installation
-
-### 1. Add the dependency (Zig 0.14+)
-
-```sh
-zig fetch --save git+https://git.bouvais.lu/adrien/zig-dimal#0.2.0
-```
-
-### 2. Wire it up in `build.zig`
-
-```zig
-const std = @import("std");
-
-pub fn build(b: *std.Build) void {
-    const target = b.standardTargetOptions(.{});
-    const optimize = b.standardOptimizeOption(.{});
-    
-    const dimal = b.dependency("dimal", .{
-        .target = target,
-        .optimize = optimize,
-    }).module("dimal");
-
-    const exe = b.addExecutable(.{
-        .name = "my_app",
-        .root_source_file = b.path("src/main.zig"),
-        .target = target,
-        .optimize = optimize,
-    });
-    exe.root_module.addImport("dimal", dimal);
-    b.installArtifact(exe);
-}
-```
-
-### 3. Import and use
-
-```zig
-const dma = @import("dimal");
-const Tensor = dma.Tensor;
-const Base = dma.Base;
-```
-
---
-
-## Quick Example: Lunar Descent
-
-Simulate a spacecraft descending to the Moon with correct physics and type safety:
-
-```zig
-const std = @import("std");
-const dma = @import("dimal");
-const Tensor = dma.Tensor;
-
-pub fn main() void {
-    // Define types: m/s² acceleration, m/s velocity, m distance
-    const Acceleration = dma.Base.Acceleration.Of(f64);
-    const Velocity = dma.Base.Velocity.Of(f64);
-    const Distance = dma.Base.Meter.Of(f64);
-    const Time = dma.Base.Second.Of(f64);
-
-    // Initial conditions
-    const g_moon: Acceleration = .{ .data = @splat(1.62) };
-    const v_initial: Velocity = .{ .data = @splat(100.0) };
-    const h_initial: Distance = .{ .data = @splat(10000.0) };
-    const dt: Time = .{ .data = @splat(1.0) };
-
-    var h = h_initial;
-    var v = v_initial;
-    var t: f64 = 0;
-
-    // Simulate descent
-    while (h.data[0] > 0 and t < 1000) : (t += 1.0) {
-        // a = -g (gravity pulls down)
-        const a = g_moon.mul(-1.0);
-
-        // Update: v = v₀ + at
-        v = v.add(a.mul(dt));
-
-        // Update: h = h₀ + vt
-        h = h.add(v.mul(dt));
-
-        if (@mod(t, 100.0) == 0) {
-            std.debug.print("t={d:.0}s | h={d:.1} | v={d:.1}\n", .{
-                t,
-                h,
-                v,
-            });
-        }
-    }
-
-    std.debug.print("Landed in {d:.1}s at h={d:.1}\n", .{ t, h });
-}
-```
-
-**Output:**
-```
-t=0s | h=10000m | v=100m.s⁻¹
-t=100s | h=8019m | v=-61.8m.s⁻¹
-t=200s | h=4174.4m | v=-223.6m.s⁻¹
-...
-Landed in 323.5s at h=-0.01m
-```
-
---
-
-## API Overview
-
-### Tensors
-
-A **`Tensor`** is parameterized by:
- **`T`** — numeric type: `f32`, `f64`, `i128`, etc.
- **`dims`** — physical dimensions (struct literal): `.{.L = 1, .T = -1}` means length/time (velocity).
- **`scales`** — SI prefixes or custom scales: `.{.L = .k, .T = .hour}` means km/h.
- **`shape`** — array shape: `&.{1}` is a scalar, `&.{3}` is a 3-vector, `&.{3, 3}` is a 3×3 matrix.
-
-```zig
-// Scalar: 1-element tensor
-const Meter = Tensor(f64, .{.L = 1}, .{}, &.{1});
-const m = Meter{ .data = @splat(5.0) };
-
-// Vector: N-element tensor (SIMD)
-const Vec3Meter = Tensor(f64, .{.L = 1}, .{}, &.{3});
-const v = Vec3Meter{ .data = @shuffle(f64, [_]f64{1, 2, 3}, [_]f64 undefined, [_]i32{0, 1, 2, 0, 0, 0}) };
-
-// Matrix: M×N tensor (SIMD-accelerated)
-const Mat3x3Velocity = Tensor(f32, .{.L = 1, .T = -1}, .{}, &.{3, 3});
-const m_vel = Mat3x3Velocity{ .data = @splat(10.0) };
-
-// Higher-rank tensor
-const Rank4 = Tensor(f64, .{.M = 1}, .{}, &.{2, 3, 4, 5});
-```
-
-### Common Operations
-
-| Operation | Description |
-|-----------|-------------|
-| `.add(rhs)` | Element-wise addition. Auto-converts scales. |
-| `.sub(rhs)` | Element-wise subtraction. |
-| `.mul(rhs)` | Multiply; dimensions are summed. `rhs` can be a tensor or bare number. |
-| `.div(rhs)` | Divide; dimensions are subtracted. |
-| `.contract(other, axis_a, axis_b)` | Tensor contraction: dot product, matrix multiply, or general N-D contraction. |
-| `.cross(rhs)` | Cross product (3-vectors only). Returns a 3-vector. |
-| `.length()` / `.lengthSqr()` | Euclidean length (or squared length) of a vector. Returns a scalar `T`. |
-| `.product()` | Multiply all elements. Returns a scalar with combined dimensions. |
-| `.abs()` | Element-wise absolute value. Dimensions unchanged. |
-| `.pow(exp)` | Raise to comptime exponent. Dimension exponents multiplied by `exp`. |
-| `.sqrt()` | Element-wise square root. Compile error if any dimension exponent is odd. |
-| `.to(DestType)` | Convert to another unit of the same dimension. Comptime error on mismatch. |
-| `.eq(rhs)` / `.ne(rhs)` | Element-wise equality/inequality. |
-| `.gt(rhs)` / `.gte(rhs)` | Greater-than comparisons. |
-| `.lt(rhs)` / `.lte(rhs)` | Less-than comparisons. |
-
-### Pre-built Types (via `dma.Base`)
-
-Use `.Of(T)` for base units, `.Scaled(T, scales)` for custom scales:
-
-```zig
-const Velocity = dma.Base.Velocity.Of(f64);
-const Kmh = dma.Base.Velocity.Scaled(f64, .{.L = .k, .T = .hour});
-const Force = dma.Base.Force.Of(f32);
-const Energy = dma.Base.Energy.Of(f64);
-```
-
-Also available: `Acceleration`, `Inertia`, `Pressure`, `Power`, `Area`, `Volume`, `Density`, `Frequency`, `Viscosity`, `Charge`, `Potential`, `Resistance`, `MagneticFlux`, `ThermalCapacity`, `ThermalConductivity`, and many more.
-
---
-
-## SIMD Performance
-
-Operations on vectors and matrices use Zig's `@Vector` intrinsics, which compile to SIMD instructions on most platforms. This makes vector operations faster than equivalent scalar loops, but don't expect miracles—SIMD is still limited by memory bandwidth and CPU cache.
-
-Run the included benchmarks to see what you get on your hardware:
-```sh
-zig build benchmark
-```
-
---
-
-## Next Steps
-
- **GPU support** — eventually, for large tensor operations. WebGPU is a target.
- **Toy physics language** — I've been sketching ideas for a language optimized for numerical physics (tentatively called Éclat). It would use dimal as the foundation. No timeline yet; this is a long-term experiment.
-
---
-
-## Testing & Benchmarks
-
-```sh
-zig build test       # Run all unit tests
-zig build benchmark  # Run performance benchmarks
-```
-
---
-
-## License
-
-See the repository for license details.
--- a/docs/wishlist.md
+++ b/docs/wishlist.md
@ -1,3 +0,0 @@
-## GPU support with WebGPU
-
-Example: https://github.com/seyhajin/webgpu-wasm-zig
--- a/mkdocs.yml
+++ b/mkdocs.yml
@ -1,48 +0,0 @@
-site_name: Bouvais Docs
-site_url: https://zig-dimal.bouvais.lu
-site_description: A minimal technical documentation site.
-site_author: Adrien Bouvais
-
-theme:
-  name: material
-  language: en
-  # Color palette with auto light/dark mode
-  palette:
-    - media: "(prefers-color-scheme: light)"
-      scheme: default
-      primary: indigo
-      accent: indigo
-      toggle:
-        icon: material/brightness-7
-        name: Switch to dark mode
-    - media: "(prefers-color-scheme: dark)"
-      scheme: slate
-      primary: indigo
-      accent: indigo
-      toggle:
-        icon: material/brightness-4
-        name: Switch to light mode
-  
-  features:
-    - navigation.sections
-    - navigation.top
-    - content.code.copy
-    - content.code.annotate
-
-# Minimal plugins
-plugins:
-  - search
-
-# Your single page
-nav:
-  - Home: index.md
-
-# Extensions to make your markdown look better
-markdown_extensions:
-  - admonition
-  - pymdownx.details
-  - pymdownx.superfences
-  - pymdownx.highlight:
-      anchor_linenums: true
-  - pymdownx.inlinehilite
-  - attr_list
--- a/src/Base.zig
+++ b/src/Base.zig
@ -3,7 +3,7 @@ const std = @import("std");
 // Adjust these imports to match your actual file names
 const Dimensions = @import("Dimensions.zig");
 const Scales = @import("Scales.zig");
-const Tensor = @import("Tensor.zig").Tensor;
+const Tensor = @import("TensorStatic.zig").Tensor;

 fn PhysicalConstant(comptime d: Dimensions.ArgOpts, comptime val: f64, comptime s: Scales.ArgOpts) type {
    return struct {
@ -60,7 +60,7 @@ pub const Constants = struct {
    /// Newtonian constant of gravitation (G) [m³⋅kg⁻¹⋅s⁻²]
    pub const Gravitational = PhysicalConstant(.{ .M = -1, .L = 3, .T = -2 }, 6.67430e-11, .{ .M = .k });

-    /// Stefan–Boltzmann constant (σ) [W⋅m⁻²⋅K⁻⁴ = kg⋅s⁻³⋅K⁻⁴]
+    /// Stefan-Boltzmann constant (σ) [W⋅m⁻²⋅K⁻⁴ = kg⋅s⁻³⋅K⁻⁴]
    pub const StefanBoltzmann = PhysicalConstant(.{ .M = 1, .T = -3, .Tp = -4 }, 5.670374419e-8, .{ .M = .k });

    /// Elementary charge (e) [C = A⋅s]
@ -81,7 +81,7 @@ pub const Constants = struct {
    /// Neutron mass (m_n) [kg]
    pub const NeutronMass = PhysicalConstant(.{ .M = 1 }, 1.67492750056e-27, .{ .M = .k });

-    /// Fine-structure constant (α) [Dimensionless]
+    /// Fine-structure constant (α) [Dimensionless]
    pub const FineStructure = PhysicalConstant(.{}, 0.0072973525643, .{});

    /// Avogadro constant (N_A) [mol⁻¹]
--- a/src/Dimensions.zig
+++ b/src/Dimensions.zig
@ -1,13 +1,13 @@
 const std = @import("std");

 pub const ArgOpts = struct {
-    L: comptime_int = 0,
-    M: comptime_int = 0,
-    T: comptime_int = 0,
-    I: comptime_int = 0,
-    Tp: comptime_int = 0,
-    N: comptime_int = 0,
-    J: comptime_int = 0,
+    L: isize = 0,
+    M: isize = 0,
+    T: isize = 0,
+    I: isize = 0,
+    Tp: isize = 0,
+    N: isize = 0,
+    J: isize = 0,
 };

 pub const Dimension = enum {
--- a/src/Scales.zig
+++ b/src/Scales.zig
@ -59,7 +59,8 @@ pub const UnitScale = enum(isize) {
        var buf: [16]u8 = undefined;
        return switch (self) {
            .none => "",
-            .P, .T, .G, .M, .k, .h, .da, .d, .c, .m, .u, .n, .p, .f, .min, .hour, .year, .inch, .ft, .yd, .mi, .oz, .lb, .st => @tagName(self),
+            .P, .T, .G, .M, .k, .h, .da, .d, .c, .m, .u, .n, .p, .f, .min, .year, .inch, .ft, .yd, .mi, .oz, .lb, .st => @tagName(self),
+            .hour => "h",
            else => std.fmt.bufPrint(&buf, "[{d}]", .{@intFromEnum(self)}) catch "[]", // This cannot be inline because of non exhaustive enum, but that's ok, it is just str, not calculation
        };
    }
--- a/src/TensorAlloc.zig
+++ b/src/TensorAlloc.zig
--- a/src/TensorGpu.zig
+++ b/src/TensorGpu.zig
--- a/src/TensorStatic.zig
+++ b/src/TensorStatic.zig
--- a/src/UnitParser.zig
+++ b/src/UnitParser.zig
@ -0,0 +1,145 @@
+const std = @import("std");
+const Dimensions = @import("Dimensions.zig");
+const Scales = @import("Scales.zig");
+
+/// Result of parsing a unit string: the two argument structs that `parseUnit`
+/// fills in, kept separate so each can be handed on individually.
+/// Both fields default to their empty value (`.{}`).
+pub const ParsedUnit = struct {
+    // Exponent per base dimension; `parseSegment` adds each segment's exponent here.
+    dims: Dimensions.ArgOpts = .{},
+    // Scale per base dimension; `parseSegment` assigns the scale of the matching segment here.
+    scales: Scales.ArgOpts = .{},
+};
+
+/// Errors that unit-string parsing can report.
+pub const UnitParseError = error{
+    // Returned by `parseSegment` when a segment matches neither a scale nor a dimension unit.
+    UnknownBaseUnit,
+    // NOTE(review): not returned by `parseUnit` or `parseSegment` as written in this file.
+    UnknownPrefix,
+    // Returned by `parseSegment` when the text after the unit is not a base-10 integer.
+    InvalidExponent,
+    // Returned by `parseUnit` when the input string has length 0.
+    EmptyStr,
+};
+
+/// Parses a compound unit string such as "km/s^2", "m", "kg*m/s^2" or "1/min"
+/// into the dimension exponents and per-dimension scales of a `ParsedUnit`.
+///
+/// Grammar, as implemented here:
+///   - Segments are separated by '/', '.' or '*'.
+///   - Every segment after the first '/' belongs to the denominator (its exponent
+///     is negated), so "m/s2/kg" means m * s^-2 * kg^-1.
+///   - A bare "1" segment is a dimensionless placeholder and is skipped; this is
+///     what lets reciprocal units such as "1/min" parse.
+///   - Empty segments (for example from doubled separators) are ignored.
+///
+/// Returns `UnitParseError.EmptyStr` for an empty string and propagates any error
+/// from `parseSegment`. The signature does not force comptime evaluation; the test
+/// helper in this file evaluates the call inside a `comptime` expression.
+pub fn parseUnit(str: []const u8) !ParsedUnit {
+    if (str.len == 0) return UnitParseError.EmptyStr;

+    var parsed: ParsedUnit = .{ .dims = .{}, .scales = .{} };

+    // Once the first '/' has been seen, every later segment gets a negated exponent.
+    var is_denominator = false;

+    // Manual scan so that the kind of separator ('/' versus '.' or '*') is known.
+    var cursor: usize = 0;
+    while (cursor < str.len) {
+        // Advance to the next separator (or the end) to delimit one segment.
+        const segment_start = cursor;
+        while (cursor < str.len and str[cursor] != '/' and str[cursor] != '.' and str[cursor] != '*') : (cursor += 1) {}
+        const segment = str[segment_start..cursor];

+        // "1" carries no dimension; passing it to parseSegment would fail with
+        // UnknownBaseUnit, so it is skipped like an empty segment.
+        if (segment.len > 0 and !std.mem.eql(u8, segment, "1")) {
+            try parseSegment(segment, &parsed, is_denominator);
+        }

+        if (cursor < str.len) {
+            if (str[cursor] == '/') {
+                is_denominator = true;
+            }
+            cursor += 1; // skip the separator
+        }
+    }

+    return parsed;
+}
+
+// Parses one separator-free segment (optional scale, unit, optional exponent, e.g.
+// "km", "s^-2", "h", "m1") and accumulates the result into `parsed`.
+//   segment        - text of the segment, without any '/', '.' or '*' separator.
+//   parsed         - output; the matched dimension's exponent is added to and its scale assigned.
+//   is_denominator - when true the parsed exponent is negated before being added.
+// Errors: UnknownBaseUnit when no scale/dimension matches, InvalidExponent when the
+// text after the unit is not a base-10 integer.
+fn parseSegment(segment: []const u8, parsed: *ParsedUnit, is_denominator: bool) !void {
+    var scale: Scales.UnitScale = .none;
+    var found_scale = false;
+    var active_dim: ?Dimensions.Dimension = null;

+    // 1. Try to find a Scale + Dimension pair (e.g., "mm", "km")
+    // Scales are tried in the order returned by std.enums.values; the first one that
+    // validates wins (see the `if (found_scale) break;` below).
+    inline for (std.enums.values(Scales.UnitScale)) |sca| {
+        const s_str = sca.str();
+        // Scales whose string is empty can never be a prefix match and are skipped.
+        if (s_str.len > 0 and std.mem.startsWith(u8, segment, s_str)) {
+            // Check if it's a "Unit-as-Scale" (hour, min) or a prefix (k, m, c)
+            switch (sca) {
+                .hour, .min, .year => {
+                    // These are dimensions themselves (Time)
+                    // Accepted only when the scale text is the whole segment, or is
+                    // directly followed by '^' or a decimal digit (start of an exponent).
+                    if (segment.len == s_str.len or (segment.len > s_str.len and (segment[s_str.len] == '^' or (segment[s_str.len] >= '0' and segment[s_str.len] <= '9')))) {
+                        scale = sca;
+                        active_dim = .T;
+                        found_scale = true;
+                    }
+                },
+                else => {
+                    // Standard prefixes: Must be followed by a valid dimension unit
+                    // NOTE(review): this is a prefix test and the first dimension in enum
+                    // order wins. If one unit() string is a prefix of another (e.g. "m" vs
+                    // "mol", if that is what unit() returns), the shorter one may be chosen
+                    // and the leftover text then fails exponent parsing - confirm against
+                    // Dimensions.Dimension.unit().
+                    inline for (std.enums.values(Dimensions.Dimension)) |dim| {
+                        if (std.mem.startsWith(u8, segment[s_str.len..], dim.unit())) {
+                            scale = sca;
+                            active_dim = dim;
+                            found_scale = true;
+                            break;
+                        }
+                    }
+                },
+            }
+        }
+        if (found_scale) break;
+    }

+    // 2. If no scale prefix was found, try identifying as a pure Dimension (e.g., "m", "s")
+    // Same first-prefix-match rule as above; `scale` stays `.none` on this path.
+    if (!found_scale) {
+        inline for (std.enums.values(Dimensions.Dimension)) |dim| {
+            if (std.mem.startsWith(u8, segment, dim.unit())) {
+                active_dim = dim;
+                break;
+            }
+        }
+    }

+    const dimen = active_dim orelse return UnitParseError.UnknownBaseUnit;

+    // 3. Determine where the exponent starts
+    // If it was a Time Scale (like 'h'), the exponent starts after 'h'
+    // If it was a Prefix + Dim (like 'km'), it starts after 'km'
+    const unit_part_len = if (found_scale)
+        (if (scale == .hour or scale == .min or scale == .year) scale.str().len else scale.str().len + dimen.unit().len)
+    else
+        dimen.unit().len;

+    const expo_str = segment[unit_part_len..];

+    // 4. Parse Exponent
+    // Defaults to 1 when nothing follows the unit. A single leading '^' is optional,
+    // so "s2" and "s^2" are both handed to parseInt as "2".
+    var expo: i32 = 1;
+    if (expo_str.len > 0) {
+        const cleaned_expo = if (expo_str[0] == '^') expo_str[1..] else expo_str;
+        expo = std.fmt.parseInt(i32, cleaned_expo, 10) catch return UnitParseError.InvalidExponent;
+    }

+    if (is_denominator) expo *= -1;

+    // 5. Assign to struct
+    // The field is located by comparing field names with the dimension's tag name.
+    // The exponent accumulates (+=) but the scale is assigned (=), so a later segment
+    // for the same dimension replaces the earlier scale, including with `.none`.
+    inline for (std.meta.fields(Dimensions.ArgOpts)) |f| {
+        if (std.mem.eql(u8, f.name, @tagName(dimen))) {
+            @field(parsed.dims, f.name) += expo;
+            @field(parsed.scales, f.name) = scale;
+        }
+    }
+}
+
+// Test helper: parses `str` inside a `comptime` expression and compares the result with
+// the expected dimension and scale arguments.
+//   str             - unit string handed to `parseUnit`.
+//   expected_dims   - dimension exponents the parse should produce.
+//   expected_scales - per-dimension scales the parse should produce.
+// Returns error.WrongDims or error.WrongScales on a mismatch; a `parseUnit` error is
+// propagated by the `try`.
+inline fn testParser(
+    comptime str: []const u8,
+    comptime expected_dims: Dimensions.ArgOpts,
+    comptime expected_scales: Scales.ArgOpts,
+) !void {
+    const unit = comptime try parseUnit(str);
+    // Both sides go through `init(...)` and are compared with `eql`, not field by field.
+    if (comptime !Dimensions.init(expected_dims).eql(Dimensions.init(unit.dims))) return error.WrongDims;
+    if (comptime !Scales.init(expected_scales).eql(Scales.init(unit.scales))) return error.WrongScales;
+}
+
+// Exercises parseUnit through testParser: plain units, a prefixed unit, '/' and '.'
+// separators, exponents with and without '^', and a time unit used as a scale.
+test "parseUnit" {
+    // testParser runs the parser inside `comptime` expressions, so the comptime branch
+    // quota is raised here.
+    @setEvalBranchQuota(10000);
+    try testParser("m", .{ .L = 1 }, .{});
+    try testParser("s", .{ .T = 1 }, .{});
+    try testParser("mm", .{ .L = 1 }, .{ .L = .m });
+    try testParser("m/s", .{ .L = 1, .T = -1 }, .{});
+    // Everything after the first '/' is in the denominator; exponents are written without '^'.
+    try testParser("m1/s2/kg", .{ .L = 1, .T = -2, .M = -1 }, .{ .M = .k });
+    try testParser("km/h", .{ .L = 1, .T = -1 }, .{ .L = .k, .T = .hour });
+    // '.' is a multiplication separator; the negative exponent is explicit.
+    try testParser("m.s^-1", .{ .L = 1, .T = -1 }, .{});
+}
--- a/src/benchmark.zig
+++ b/src/benchmark.zig
@ -10,22 +10,7 @@ pub fn main(init: std.process.Init) !void {

    io = init.io;

-    // try vectorSIMDvsNative(f64, &stdout_writer.interface);
-    // try stdout_writer.flush();
-    // try vectorSIMDvsNative(f32, &stdout_writer.interface);
-    // try stdout_writer.flush();
-    // try vectorSIMDvsNative(i32, &stdout_writer.interface);
-    // try stdout_writer.flush();
-    // try vectorSIMDvsNative(i64, &stdout_writer.interface);
-    // try stdout_writer.flush();
-    // try vectorSIMDvsNative(i128, &stdout_writer.interface);
-    // try stdout_writer.flush();
-    //
-    // try bench_Scalar(&stdout_writer.interface);
-    // try stdout_writer.flush();
-    try bench_vsNative(&stdout_writer.interface);
-    try stdout_writer.flush();
-    // try bench_crossTypeVsNative(&stdout_writer.interface);
+    try bench_Scalar(&stdout_writer.interface);
    try stdout_writer.flush();
    try bench_Vector(&stdout_writer.interface);
    try stdout_writer.flush();
@ -128,7 +113,7 @@ fn bench_Scalar(writer: *std.Io.Writer) !void {
                            else if (comptime std.mem.eql(u8, op_name, "gt"))
                                (M.splat(getVal(T, i, 63))).gt(M.splat(getVal(T, i +% 3, 63)))
                            else
-                                (M.splat(getVal(T, i, 63))).mul(3);
+                                (M.splat(getVal(T, i, 63))).mul(M.splat(3));
                        },
                    );
                }
@ -169,247 +154,6 @@ fn bench_Scalar(writer: *std.Io.Writer) !void {
    try writer.print("└──────────────┴───────┴───────┴───────┴───────┴───────┴───────┴───────┘\n", .{});
 }

-fn bench_vsNative(writer: *std.Io.Writer) !void {
-    const ITERS: usize = 100_000;
-    const SAMPLES: usize = 100;
-
-    const getValT = struct {
-        fn f(comptime TT: type, i: usize) TT {
-            const v = (i % 100) + 1;
-            return if (comptime @typeInfo(TT) == .float) @floatFromInt(v) else @intCast(v);
-        }
-    }.f;
-
-    const Types = .{ f64, i64, i128, f32, f64 };
-    const TNames = .{ "f64", "i64", "i128", "f32", "f64" };
-    // Expanded Ops to match bench_Scalar
-    const Ops = .{ "add", "sub", "mul", "div", "abs", "eq", "gt" };
-
-    try writer.print(
-        \\
-        \\ Scalar vs Native Overhead Analysis
-        \\
-        \\┌───────────┬──────┬───────────┬───────────┬───────────┬───────────────────────┐
-        \\│ Operation │ Type │ Native    │ @Vector   │ Tensor{{1}} │ Slowdown  Nat | Vec   │
-        \\├───────────┼──────┼───────────┼───────────┼───────────┼───────────────────────┤
-        \\
-    , .{});
-
-    inline for (Ops, 0..) |op_name, j| {
-        inline for (Types, 0..) |T, tidx| {
-            var native_total_ns: f64 = 0;
-            var vector_total_ns: f64 = 0;
-            var tensor_total_ns: f64 = 0;
-
-            const M = Tensor(T, .{}, .{}, &.{1});
-
-            std.mem.doNotOptimizeAway({
-                for (0..SAMPLES) |_| {
-                    // --- 1. Benchmark Native ---
-                    const n_start = getTime();
-                    const a = getValT(T, 10);
-                    const b = getValT(T, 2);
-                    for (0..ITERS) |_| {
-                        // Native logic branch
-                        _ = if (comptime std.mem.eql(u8, op_name, "add"))
-                            if (comptime @typeInfo(T) == .int) a +| b else a + b
-                        else if (comptime std.mem.eql(u8, op_name, "sub"))
-                            if (comptime @typeInfo(T) == .int) a -| b else a - b
-                        else if (comptime std.mem.eql(u8, op_name, "mul"))
-                            if (comptime @typeInfo(T) == .int) a *| b else a * b
-                        else if (comptime std.mem.eql(u8, op_name, "div"))
-                            if (comptime @typeInfo(T) == .int) @divTrunc(a, b) else a / b
-                        else if (comptime std.mem.eql(u8, op_name, "abs"))
-                            if (comptime @typeInfo(T) == .int) @abs(a) else @as(T, @abs(a))
-                        else if (comptime std.mem.eql(u8, op_name, "eq"))
-                            a == b
-                        else if (comptime std.mem.eql(u8, op_name, "gt"))
-                            a > b
-                        else
-                            unreachable;
-                    }
-                    const n_end = getTime();
-                    native_total_ns += @as(f64, @floatFromInt(n_start.durationTo(n_end).toNanoseconds()));
-
-                    const v_start = getTime();
-                    const va = getValT(T, 10);
-                    const vb = getValT(T, 2);
-                    for (0..ITERS) |_| {
-                        // Native logic branch
-                        _ = if (comptime std.mem.eql(u8, op_name, "add"))
-                            if (comptime @typeInfo(T) == .int) va +| vb else va + vb
-                        else if (comptime std.mem.eql(u8, op_name, "sub"))
-                            if (comptime @typeInfo(T) == .int) va -| vb else va - vb
-                        else if (comptime std.mem.eql(u8, op_name, "mul"))
-                            if (comptime @typeInfo(T) == .int) va *| vb else va * vb
-                        else if (comptime std.mem.eql(u8, op_name, "div"))
-                            if (comptime @typeInfo(T) == .int) @divTrunc(va, vb) else va / vb
-                        else if (comptime std.mem.eql(u8, op_name, "abs"))
-                            if (comptime @typeInfo(T) == .int) @abs(va) else @as(T, @abs(va))
-                        else if (comptime std.mem.eql(u8, op_name, "eq"))
-                            va == vb
-                        else if (comptime std.mem.eql(u8, op_name, "gt"))
-                            va > vb
-                        else
-                            unreachable;
-                    }
-                    const v_end = getTime();
-                    vector_total_ns += @as(f64, @floatFromInt(v_start.durationTo(v_end).toNanoseconds()));
-
-                    // --- 2. Benchmark Scalar ---
-                    const q_start = getTime();
-                    const qa = M.splat(getValT(T, 10));
-                    const qb = M.splat(getValT(T, 2));
-                    for (0..ITERS) |_| {
-                        // Scalar logic branch
-                        _ = if (comptime std.mem.eql(u8, op_name, "add"))
-                            qa.add(qb)
-                        else if (comptime std.mem.eql(u8, op_name, "sub"))
-                            qa.sub(qb)
-                        else if (comptime std.mem.eql(u8, op_name, "mul"))
-                            qa.mul(qb)
-                        else if (comptime std.mem.eql(u8, op_name, "div"))
-                            qa.div(qb)
-                        else if (comptime std.mem.eql(u8, op_name, "abs"))
-                            qa.abs()
-                        else if (comptime std.mem.eql(u8, op_name, "eq"))
-                            qa.eq(qb)
-                        else if (comptime std.mem.eql(u8, op_name, "gt"))
-                            qa.gt(qb)
-                        else
-                            unreachable;
-                    }
-                    const q_end = getTime();
-                    tensor_total_ns += @as(f64, @floatFromInt(q_start.durationTo(q_end).toNanoseconds()));
-                }
-            });
-
-            const avg_n = (native_total_ns / SAMPLES) / @as(f64, @floatFromInt(ITERS));
-            const avg_v = (vector_total_ns / SAMPLES) / @as(f64, @floatFromInt(ITERS));
-            const avg_t = (tensor_total_ns / SAMPLES) / @as(f64, @floatFromInt(ITERS));
-            const slowdown_nt = avg_t / avg_n;
-            const slowdown_vt = avg_t / avg_v;
-
-            try writer.print("│ {s:<9} │ {s:<4} │ {d:>7.2}ns │ {d:>7.2}ns │ {d:>7.2}ns │ {d:>8.2}x   {d:>8.2}x │\n", .{
-                op_name, TNames[tidx], avg_n, avg_v, avg_t, slowdown_nt, slowdown_vt,
-            });
-        }
-        if (j != Ops.len - 1) try writer.print("├───────────┼──────┼───────────┼───────────┼───────────┼───────────────────────┤\n", .{});
-    }
-
-    try writer.print("└───────────┴──────┴───────────┴───────────┴───────────┴───────────────────────┘\n", .{});
-}
-
-fn bench_crossTypeVsNative(writer: *std.Io.Writer) !void {
-    const ITERS: usize = 100_000;
-    const SAMPLES: usize = 5;
-
-    const getValT = struct {
-        fn f(comptime TT: type, i: usize) TT {
-            // Keep values safe and non-zero to avoid division by zero or overflows during cross-casting
-            const v = (i % 50) + 1;
-            return if (comptime @typeInfo(TT) == .float) @floatFromInt(v) else @intCast(v);
-        }
-    }.f;
-
-    // Helper for the Native baseline: explicitly casting T2 to T1 before the operation
-    const castTo = struct {
-        fn f(comptime DestT: type, comptime SrcT: type, val: SrcT) DestT {
-            if (comptime DestT == SrcT) return val;
-            const src_info = @typeInfo(SrcT);
-            const dest_info = @typeInfo(DestT);
-
-            if (dest_info == .int and src_info == .int) return @intCast(val);
-            if (dest_info == .float and src_info == .int) return @floatFromInt(val);
-            if (dest_info == .int and src_info == .float) return @intFromFloat(val);
-            if (dest_info == .float and src_info == .float) return @floatCast(val);
-            unreachable;
-        }
-    }.f;
-
-    const Types = .{ i16, i64, i128, f32, f64 };
-    const TNames = .{ "i16", "i64", "i128", "f32", "f64" };
-    const Ops = .{ "add", "mul", "div" };
-
-    try writer.print(
-        \\
-        \\ Cross-Type Overhead Analysis: Scalar vs Native
-        \\
-        \\┌─────────┬──────┬──────┬───────────┬───────────┬───────────┐
-        \\│ Op      │ T1   │ T2   │ Native    │ Scalar    │ Slowdown  │
-        \\├─────────┼──────┼──────┼───────────┼───────────┼───────────┤
-        \\
-    , .{});
-
-    inline for (Ops, 0..) |op_name, j| {
-        inline for (Types, 0..) |T1, t1_idx| {
-            inline for (Types, 0..) |T2, t2_idx| {
-                var native_total_ns: f64 = 0;
-                var quantity_total_ns: f64 = 0;
-
-                const M1 = Tensor(T1, .{ .L = 1 }, .{}, &.{1});
-                const M2 = Tensor(T2, .{ .L = 1 }, .{}, &.{1});
-                const S2 = Tensor(T2, .{ .T = 1 }, .{}, &.{1});
-
-                std.mem.doNotOptimizeAway({
-                    for (0..SAMPLES) |_| {
-                        // --- 1. Benchmark Native (Cast T2 to T1, then math) ---
-                        const n_start = getTime();
-                        for (0..ITERS) |i| {
-                            const a = getValT(T1, i);
-                            const b_raw = getValT(T2, 2);
-                            const b = castTo(T1, T2, b_raw);
-
-                            _ = if (comptime std.mem.eql(u8, op_name, "add"))
-                                a + b
-                            else if (comptime std.mem.eql(u8, op_name, "mul"))
-                                a * b
-                            else if (comptime @typeInfo(T1) == .int)
-                                @divTrunc(a, b)
-                            else
-                                a / b;
-                        }
-                        const n_end = getTime();
-                        native_total_ns += @as(f64, @floatFromInt(n_start.durationTo(n_end).toNanoseconds()));
-
-                        // --- 2. Benchmark Scalar ---
-                        const q_start = getTime();
-                        for (0..ITERS) |i| {
-                            const qa = M1.splat(getValT(T1, i));
-                            const qb = if (comptime std.mem.eql(u8, op_name, "div"))
-                                S2.splat(getValT(T2, 2))
-                            else
-                                M2.splat(getValT(T2, 2));
-
-                            _ = if (comptime std.mem.eql(u8, op_name, "add"))
-                                qa.add(qb)
-                            else if (comptime std.mem.eql(u8, op_name, "mul"))
-                                qa.mul(qb)
-                            else
-                                qa.div(qb);
-                        }
-                        const q_end = getTime();
-                        quantity_total_ns += @as(f64, @floatFromInt(q_start.durationTo(q_end).toNanoseconds()));
-                    }
-
-                    const avg_n = (native_total_ns / SAMPLES) / @as(f64, @floatFromInt(ITERS));
-                    const avg_q = (quantity_total_ns / SAMPLES) / @as(f64, @floatFromInt(ITERS));
-                    const slowdown = avg_q / avg_n;
-
-                    try writer.print("│ {s:<7} │ {s:<4} │ {s:<4} │ {d:>7.2}ns │ {d:>7.2}ns │ {d:>8.2}x │\n", .{
-                        op_name, TNames[t1_idx], TNames[t2_idx], avg_n, avg_q, slowdown,
-                    });
-                });
-            }
-        }
-        if (j != Ops.len - 1) {
-            try writer.print("├─────────┼──────┼──────┼───────────┼───────────┼───────────┤\n", .{});
-        }
-    }
-
-    try writer.print("└─────────┴──────┴──────┴───────────┴───────────┴───────────┘\n", .{});
-}
-
 fn bench_Vector(writer: *std.Io.Writer) !void {
    const ITERS: usize = 10_000;
    const SAMPLES: usize = 10;
@ -448,7 +192,7 @@ fn bench_Vector(writer: *std.Io.Writer) !void {
    const TNames = .{ "i32", "i64", "i128", "f32", "f64" };
    const Lengths = .{ 1, 3, 4, 16, 100 };
    // "cross" is only valid for len=3; other cells will show "  ---  "
-    const Ops = .{ "add", "div", "mulScalar", "dot", "cross", "product", "pow", "length" };
+    const Ops = .{ "add", "div", "mulScalar", "dot", "product", "pow", "length" };

    inline for (Ops, 0..) |op_name, o_idx| {
        inline for (Types, TNames) |T, tname| {
@ -484,10 +228,6 @@ fn bench_Vector(writer: *std.Io.Writer) !void {
                            } else if (comptime std.mem.eql(u8, op_name, "dot")) {
                                const v2 = V.splat(getVal(T, i +% 5, 63));
                                _ = v1.contract(v2, 0, 0);
-                            } else if (comptime std.mem.eql(u8, op_name, "cross")) {
-                                // len == 3 guaranteed by the guard above
-                                const v2 = V.splat(getVal(T, i +% 5, 63));
-                                _ = v1.cross(v2);
                            } else if (comptime std.mem.eql(u8, op_name, "product")) {
                                _ = v1.product();
                            } else if (comptime std.mem.eql(u8, op_name, "pow")) {
@ -610,62 +350,3 @@ fn bench_HighDimTensor(writer: *std.Io.Writer) !void {
    }
    try writer.print("└─────────────────┴──────┴──────────────┴──────────────┴──────────────┴──────────────┘\n", .{});
 }
-
-fn vectorSIMDvsNative(comptime T: type, writer: *std.Io.Writer) !void {
-    const iterations: u64 = 10_000;
-    const lens = [_]u32{ 1, 2, 3, 4, 5, 10, 100, 1_000, 10_000 };
-
-    try writer.print("\nSIMD Speedup Analysis: {s}\n", .{@typeName(T)});
-    try writer.print("┌────────────┬────────────┬────────────┬────────────┐\n", .{});
-    try writer.print("│ Vector Len │ Scalar (us)│ Vector (us)│ Speedup    │\n", .{});
-    try writer.print("├────────────┼────────────┼────────────┼────────────┤\n", .{});
-
-    inline for (lens) |vector_len| {
-        // --- Scalar Test ---
-        var scalar_val: T = 10;
-        const start_scalar = getTime();
-
-        var i: u64 = 0;
-        while (i < iterations * vector_len) : (i += 1) {
-            if (comptime @typeInfo(T) == .int)
-                scalar_val = scalar_val +% 1
-            else
-                scalar_val = scalar_val + 1;
-        }
-        const scalar_time = start_scalar.durationTo(getTime()).toMicroseconds();
-
-        // --- Vector Test ---
-        var vector_val: @Vector(vector_len, T) = @splat(20);
-        const start_vector = getTime();
-
-        i = 0;
-        const increment: @Vector(vector_len, T) = @splat(1);
-        while (i < iterations) : (i += 1) {
-            if (comptime @typeInfo(T) == .int)
-                vector_val = vector_val +% increment
-            else
-                vector_val = vector_val + increment;
-        }
-        const vector_time = start_vector.durationTo(getTime()).toMicroseconds();
-
-        // --- Results ---
-        const s_float = @as(f64, @floatFromInt(scalar_time));
-        const v_float = @as(f64, @floatFromInt(vector_time));
-
-        // Speedup = ScalarTime / VectorTime.
-        // > 1.0 means SIMD is faster.
-        const speedup = if (vector_time > 0) s_float / v_float else 0;
-
-        try writer.print("│ {d:<10} │ {d:>10} │ {d:>10} │ {d:>9.2}x │\n", .{
-            vector_len,
-            scalar_time,
-            vector_time,
-            speedup,
-        });
-        try writer.flush();
-
-        std.mem.doNotOptimizeAway(scalar_val);
-        std.mem.doNotOptimizeAway(vector_val);
-    }
-    try writer.print("└────────────┴────────────┴────────────┴────────────┘\n", .{});
-}
--- a/src/lib.zig
+++ b/src/lib.zig
@ -0,0 +1,9 @@
+const std = @import("std");
+
+pub const TensorStatic = @import("TensorStatic.zig").Tensor;
+pub const TensorAlloc = @import("TensorAlloc.zig").Tensor;
+pub const TensorGpu = @import("TensorGpu.zig").Tensor;
+pub const Dimensions = @import("Dimensions.zig");
+pub const Scales = @import("Scales.zig");
+pub const Base = @import("Base.zig");
+pub const UnitParser = @import("UnitParser.zig");
--- a/src/main.zig
+++ b/src/main.zig
@ -1,13 +0,0 @@
-const std = @import("std");
-
-pub const Tensor = @import("Tensor.zig").Tensor;
-pub const Dimensions = @import("Dimensions.zig");
-pub const Scales = @import("Scales.zig");
-pub const Base = @import("Base.zig");
-
-test {
-    _ = @import("Tensor.zig");
-    _ = @import("Dimensions.zig");
-    _ = @import("Scales.zig");
-    _ = @import("Base.zig");
-}
--- a/src/shared.zig
+++ b/src/shared.zig
@ -0,0 +1,155 @@
+const std = @import("std");
+const Scales = @import("Scales.zig");
+const UnitScale = Scales.UnitScale;
+const Dimensions = @import("Dimensions.zig");
+const Dimension = Dimensions.Dimension;
+
+pub const TensorKind = enum { static, alloc, gpu };
+
+/// Report whether `T` is a struct type that declares `ISTENSOR`.
+/// Any non-struct type yields `false` without `@hasDecl` being evaluated on it.
+pub fn isTensor(comptime T: type) bool {
+    return switch (@typeInfo(T)) {
+        .@"struct" => @hasDecl(T, "ISTENSOR"),
+        else => false,
+    };
+}
+
+/// Multiply every extent in `shape` together; an empty shape gives 1.
+pub fn shapeTotal(shape: []const comptime_int) usize {
+    var product: comptime_int = 1;
+    var idx: usize = 0;
+    while (idx < shape.len) : (idx += 1) product *= shape[idx];
+    return product;
+}
+
+/// Report whether `a` and `b` are the same shape: equal length and equal
+/// value at every position.
+pub fn shapeEql(a: []const comptime_int, b: []const comptime_int) bool {
+    if (a.len != b.len) return false;
+    // Lengths match here, so the two slices can be walked in lock-step.
+    for (a, b) |lhs, rhs| {
+        if (lhs != rhs) return false;
+    }
+    return true;
+}
+
+/// Compute row-major (C-order) strides for `shape`, where each stride is the
+/// product of all extents to its right.
+///   shape {3, 4}    → strides {4, 1}
+///   shape {2, 3, 4} → strides {12, 4, 1}
+/// A zero-length shape returns a zero-length array.
+pub fn shapeStrides(shape: []const comptime_int) [shape.len]comptime_int {
+    const rank = shape.len;
+    var strides: [rank]comptime_int = undefined;
+    // Walk from the last axis to the first, carrying the product of the
+    // extents already visited.
+    var running: comptime_int = 1;
+    var axis: comptime_int = rank;
+    while (axis > 0) : (axis -= 1) {
+        strides[axis - 1] = running;
+        running *= shape[axis - 1];
+    }
+    return strides;
+}
+
+/// Copy `shape` into a new array one element shorter, leaving out the entry
+/// at index `axis`. The remaining entries keep their relative order.
+pub fn shapeRemoveAxis(shape: []const comptime_int, axis: comptime_int) [shape.len - 1]comptime_int {
+    var kept: [shape.len - 1]comptime_int = undefined;
+    var dst: comptime_int = 0;
+    for (shape, 0..) |extent, src| {
+        if (src == axis) continue;
+        kept[dst] = extent;
+        dst += 1;
+    }
+    return kept;
+}
+
+/// Build a new array holding every element of `a` followed by every element of `b`.
+pub fn shapeCat(a: []const comptime_int, b: []const comptime_int) [a.len + b.len]comptime_int {
+    var joined: [a.len + b.len]comptime_int = undefined;
+    var at: usize = 0;
+    for (a) |v| {
+        joined[at] = v;
+        at += 1;
+    }
+    for (b) |v| {
+        joined[at] = v;
+        at += 1;
+    }
+    return joined;
+}
+
+/// Decode a flat row-major index into N-D coordinates.
+/// Called only in comptime contexts (all arguments are comptime).
+///
+/// `flat` is the flat index, `n` the number of axes and `strd` the stride of
+/// each axis. For every axis the coordinate is the quotient of the remaining
+/// index by that stride, and the remainder is carried to the next axis.
+/// An axis whose stride is 0 gets coordinate 0 and resets the remainder to 0.
+pub fn decodeFlatCoords(flat: comptime_int, n: comptime_int, strd: [n]comptime_int) [n]usize {
+    // Build the result with the declared element type: an array of
+    // comptime_int does not coerce to an array of usize on return.
+    var coords: [n]usize = undefined;
+    var tmp = flat;
+    for (0..n) |i| {
+        coords[i] = if (strd[i] == 0) 0 else tmp / strd[i];
+        tmp = if (strd[i] == 0) 0 else tmp % strd[i];
+    }
+    return coords;
+}
+
+/// Fold N-D coordinates into a flat row-major index: the sum over the first
+/// `n` axes of `coords[axis] * strd[axis]`.
+/// Called only in comptime contexts.
+pub fn encodeFlatCoords(coords: []const usize, n: usize, strd: [n]usize) usize {
+    var acc: usize = 0;
+    var axis: usize = 0;
+    while (axis < n) : (axis += 1) {
+        acc += coords[axis] * strd[axis];
+    }
+    return acc;
+}
+
+/// Produce an `n`-element coordinate array in which position `axis` holds
+/// `val` and every other position is filled, in order, from `free`.
+/// `free` carries the remaining (non-contracted) coordinates.
+pub fn insertAxis(
+    comptime n: usize,
+    comptime axis: usize,
+    comptime val: usize,
+    comptime free: []const usize,
+) [n]usize {
+    var full: [n]usize = undefined;
+    var next_free: usize = 0;
+    for (&full, 0..) |*slot, pos| {
+        if (pos == axis) {
+            slot.* = val;
+            continue;
+        }
+        slot.* = free[next_free];
+        next_free += 1;
+    }
+    return full;
+}
+
+/// Report whether `T` is an integer type, counting `comptime_int` as one.
+pub inline fn isInt(comptime T: type) bool {
+    return switch (@typeInfo(T)) {
+        .int, .comptime_int => true,
+        else => false,
+    };
+}
+
+/// Combine the `scales` of two types into a single `Scales` value, deciding
+/// per `Dimension` which of the two scales to keep.
+///
+/// `T1` and `T2` must each expose `dims` (a `Dimensions`) and `scales`
+/// (a `Scales`) declarations. For every dimension:
+///   - both `dims` entries are 0 → `.none`
+///   - only T1's entry is 0      → T2's scale
+///   - only T2's entry is 0      → T1's scale
+///   - otherwise                 → the scale with the smaller `getFactor()`
+///                                 (T1's scale when the factors are equal)
+/// NOTE(review): presumably a `dims` entry of 0 means the dimension is
+/// absent from that type — confirm against Dimensions.zig.
+pub fn finerScales(comptime T1: type, comptime T2: type) Scales {
+    const d1: Dimensions = T1.dims;
+    const d2: Dimensions = T2.dims;
+    const s1: Scales = T1.scales;
+    const s2: Scales = T2.scales;
+    // Start with every dimension set to `.none`; each entry is overwritten below.
+    comptime var out = Scales.initFill(.none);
+    for (std.enums.values(Dimension)) |dim| {
+        const scale1 = comptime s1.get(dim);
+        const scale2 = comptime s2.get(dim);
+        // The branch order matters: the zero checks come first so the factor
+        // comparison only runs when both types have a non-zero entry.
+        out.set(dim, if (comptime d1.get(dim) == 0 and d2.get(dim) == 0)
+            .none
+        else if (comptime d1.get(dim) == 0)
+            scale2
+        else if (comptime d2.get(dim) == 0)
+            scale1
+        else if (comptime scale1.getFactor() > scale2.getFactor())
+            scale2
+        else
+            scale1);
+    }
+    return out;
+}
+
+/// Write `n` to `writer` as Unicode superscript characters,
+/// e.g. `-12` is written as "⁻¹²".
+///
+/// Nothing is written when `n` is 0. A negative value is prefixed with the
+/// superscript minus sign (U+207B). Errors from `writer` are propagated.
+pub fn printSuperscript(writer: *std.Io.Writer, n: i32) !void {
+    // Superscript form of each decimal digit, indexed by the digit's value.
+    const superscripts = [10][]const u8{
+        "\u{2070}", "\u{00B9}", "\u{00B2}", "\u{00B3}", "\u{2074}",
+        "\u{2075}", "\u{2076}", "\u{2077}", "\u{2078}", "\u{2079}",
+    };
+
+    if (n == 0) return;
+    if (n < 0) try writer.writeAll("\u{207B}");
+
+    // @abs returns a u32, so minInt(i32) is handled; negating the i32
+    // directly would overflow for that value.
+    const magnitude: u32 = @abs(n);
+
+    // A u32 has at most 10 decimal digits, so the 12-byte buffer always fits.
+    var buf: [12]u8 = undefined;
+    const digits = std.fmt.bufPrint(&buf, "{d}", .{magnitude}) catch unreachable;
+    for (digits) |c| {
+        try writer.writeAll(superscripts[c - '0']);
+    }
+}
--- a/src/test.zig
+++ b/src/test.zig
@ -0,0 +1,9 @@
+// Test root: importing each module here makes the compiler analyze it, so
+// the `test` declarations inside those files are picked up when this file
+// is built as the test entry point.
+test {
+    _ = @import("TensorStatic.zig");
+    _ = @import("TensorAlloc.zig");
+    _ = @import("TensorGpu.zig");
+    _ = @import("Dimensions.zig");
+    _ = @import("Scales.zig");
+    _ = @import("Base.zig");
+    _ = @import("UnitParser.zig");
+}
Author	SHA1	Message	Date
adrien	22ffd4fc64	Fix TensorAlloc copy that was copying the ptr	2026-05-27 21:15:58 +02:00
adrien	9ac3d4d699	Squeletton TensorGpu that init	2026-05-26 23:34:53 +02:00
adrien	2215a5d86d	Added TensorStatic and Alloc to lib.zig	2026-05-26 20:06:36 +02:00
adrien	9deb25b825	Updated zon version	2026-05-26 20:01:04 +02:00
adrien	ceff8ff1bd	Added everything to TensorAlloc	2026-05-25 22:52:27 +02:00
adrien	ff21f0ac8b	Added all operation and test for TensorAlloc, missing slice	2026-05-25 18:18:35 +02:00
adrien	5ac9968021	Added back more test for TensorAlloc	2026-05-25 13:53:17 +02:00
adrien	8028cf41a5	Removed inline for TensorAlloc fn	2026-05-25 01:54:47 +02:00
adrien	0ef19e18de	Working other base operation (sub, mul, div, ect)	2026-05-25 01:52:12 +02:00
adrien	7494595db4	Working TensorAlloc add	2026-05-25 01:44:09 +02:00
adrien	91c5c41fc5	Working comparaison for TensorAlloc	2026-05-24 21:23:20 +02:00
adrien	ba671ee486	Working basic eq between TensorAlloc	2026-05-24 18:40:14 +02:00
adrien	09d6ca1ff5	Renamed Tensor to TensorStatic	2026-05-23 10:29:57 +02:00
adrien	bcd888d59e	Splited main.zig into lib and test.zig	2026-05-20 23:02:30 +02:00
adrien	63e9b6b63d	Removed vs native benchmarks	2026-05-20 22:58:36 +02:00
adrien	957f75243f	Added zig-wgpu import	2026-05-20 16:03:15 +02:00
adrien	5f833a5e58	Removed TensorAlloc and made TensorStatic back to just Tensor Realized I can just do alloc.create instead of a all new struct	2026-05-15 00:46:22 +02:00
adrien	00e0f5ab73	Moved isTensor to shared + added isTensorAlloc/Static	2026-05-15 00:32:58 +02:00
adrien	f67e9d709d	Working add TensorAlloc	2026-05-15 00:24:39 +02:00
adrien	e6d0f62929	TensorAlloc add and to compilable but still error for basic add test	2026-05-14 22:25:35 +02:00
adrien	f702c1e09a	slice can now use null value like python [2:]	2026-05-14 10:56:26 +02:00
adrien	b959f5f28a	Added slice to TensorStatic	2026-05-14 01:28:24 +02:00
adrien	6ba1e664c1	Started to add TensorAlloc	2026-05-14 00:53:05 +02:00
adrien	6559ed9f62	Removed comptime to parseSegment	2026-05-12 09:06:28 +02:00
adrien	55906e0ab7	Small fixs	2026-05-11 17:12:37 +02:00
adrien	7d28de2028	Removed comptime for str UnitParser	2026-05-04 23:55:00 +02:00
adrien	eb3b0d4de3	Update .zon	2026-05-04 22:59:54 +02:00
adrien	5bdc78c065	Simplified pow	2026-05-04 22:57:53 +02:00
adrien	18830c8b45	Fixed benchmark	2026-05-04 22:25:18 +02:00
adrien	4595397e70	Removed the feature where you can use comptime int or float ar rhs for operation	2026-05-04 22:10:55 +02:00
adrien	7844aacfce	Added a UnitParser to get Dimensions and Scales from a str	2026-05-04 19:10:06 +02:00
adrien	9b6cd4b377	Removed release fast	2026-05-04 14:34:31 +02:00
adrien	4d275dca2d	Renamed Tensor to TensorStatic to later introduce TensorAlloc and TensorGPU	2026-04-29 18:07:13 +02:00
adrien	9635cfb481	Changed self: Self to self: *const SElf in tensor for performance	2026-04-28 16:06:13 +02:00
adrien	f0029449f0	tmp	2026-04-28 14:50:08 +02:00
adrien	8816a65518	Now pass all test with new *const way I am not quite sure about it yet, but it is faster sooo idk. Let's see long term	2026-04-28 13:51:10 +02:00
adrien	26ff02c50f	Changed TEnsor to use *const	2026-04-28 13:10:14 +02:00
adrien	bb6dd59b9a	Removed more	2026-04-28 01:02:30 +02:00
adrien	acb908a448	Removed some char	2026-04-28 01:01:40 +02:00
adrien	d4a1054fdc	Removed deploy.yaml	2026-04-28 00:58:24 +02:00
adrien	fb2a6f4806	Removed docs/	2026-04-28 00:57:50 +02:00
adrien	8c77ab86f8	Readded it but also in gitignore	2026-04-28 00:56:42 +02:00
adrien	8565869919	Removed mkdocs.yaml	2026-04-28 00:56:02 +02:00
adrien	1a69b3dbf2	Removed old .md	2026-04-28 00:55:32 +02:00