Skip to content

Instantly share code, notes, and snippets.

@bjourne
Created November 15, 2024 13:59
Show Gist options
  • Select an option

  • Save bjourne/8f705c5879aa966accf354008623f6bb to your computer and use it in GitHub Desktop.

Select an option

Save bjourne/8f705c5879aa966accf354008623f6bb to your computer and use it in GitHub Desktop.

Revisions

  1. bjourne created this gist Nov 15, 2024.
    361 changes: 361 additions & 0 deletions repr.cl
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,361 @@
    // OpenCL kernel `foo`. The identical `__kernel void foo(...) {` header is
    // opened 32 times in a row, each one inside the body of the previous one;
    // only the innermost level has statements, and the 32 matching `}` follow it.
    // NOTE(review): C / OpenCL C have no nested function definitions, so this is
    // not expected to build as an ordinary kernel. Presumably a deliberate
    // reproducer (or a paste artifact) -- confirm before collapsing the nesting.
    //
    // Parameters (the same list at every nesting level):
    //   dc_dim, sc_dim - uint extents; used only in the dn / sn products below
    //   fy_dim, fx_dim - uint extents subtracted in the dy_dim / dx_dim formulas
    //   F, S           - read-only global float buffers; never dereferenced here
    //   sy_dim, sx_dim - uint extents used in the dy_dim / dx_dim / sn formulas
    //   padding        - uint, counted twice per axis in dy_dim / dx_dim
    //   D              - writable global float buffer; never written here
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {

    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {

    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {

    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {

    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    // Innermost (32nd) level: the only one that contains statements.
    __kernel void
    foo(
    uint dc_dim, uint sc_dim,
    uint fy_dim, uint fx_dim,
    __global const float * restrict F,
    uint sy_dim, uint sx_dim,
    __global const float * restrict S,
    uint padding,
    __global float * restrict D
    ) {
    // Per-axis extent: source extent plus padding on both sides, minus the
    // filter extent, plus one.
    // NOTE(review): this has the form of a stride-1 padded-convolution output
    // size -- confirm intent. All operands are uint, so a filter extent larger
    // than the padded source extent wraps around instead of going negative.
    uint dy_dim = sy_dim + 2 * padding - fy_dim + 1;
    uint dx_dim = sx_dim + 2 * padding - fx_dim + 1;

    // Products of three extents each. Neither dn nor sn is read afterwards, and
    // F, S and D are never accessed, so the body has no observable effect.
    uint dn = dc_dim * dy_dim * dx_dim;
    uint sn = sc_dim * sy_dim * sx_dim;
    }
    // The remaining 31 braces close the enclosing `foo` levels, innermost first.
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }
    }