Python における estimate_regs_per_thread の使用例(loopy.statistics.estimate_regs_per_thread)

コード例 #1

0

ファイルを表示

ファイル: test_perf_model.py プロジェクト: jdsteve2/performance_prediction

def test_reg_counter_reduction():
    """Expect ``estimate_regs_per_thread`` to return 6 for a sum-reduction kernel.

    The kernel (named "matmul_serial") assigns ``c[i, j]`` the sum over ``k``
    of ``a[i, k]*b[k, j]``; ``a`` and ``b`` are declared as float32.
    """
    domain = "{[i,k,j]: 0<=i<n and 0<=k<m and 0<=j<l}"
    instructions = ["c[i, j] = sum(k, a[i, k]*b[k, j])"]
    kernel = lp.make_kernel(
        domain, instructions, name="matmul_serial", assumptions="n,m,l >= 1")

    # Declare the dtypes of the two input arrays before estimating registers.
    input_dtypes = {"a": np.float32, "b": np.float32}
    typed_kernel = lp.add_and_infer_dtypes(kernel, input_dtypes)

    reg_count = estimate_regs_per_thread(typed_kernel)
    assert reg_count == 6

コード例 #2

0

ファイルを表示

ファイル: test_perf_model.py プロジェクト: jdsteve2/performance_prediction

def test_reg_counter_logic():
    """Expect ``estimate_regs_per_thread`` to return 6 for a conditional kernel.

    The single instruction of the kernel (named "logic") is an ``if(...)``
    expression whose condition combines ``not``, ``and``, ``or`` and
    comparisons; ``g`` is declared as float32 and ``h`` as float64.
    """
    domain = "{[i,k,j]: 0<=i<n and 0<=k<m and 0<=j<l}"
    # The instruction text is kept verbatim, surrounding whitespace included.
    instructions = [
                """
                e[i,k] = if(not(k<l-2) and k>6 or k/2==l, g[i,k]*2, g[i,k]+h[i,k]/2)
                """
    ]
    kernel = lp.make_kernel(
        domain, instructions, name="logic", assumptions="n,m,l >= 1")

    # Declare the dtypes of the two input arrays before estimating registers.
    input_dtypes = {"g": np.float32, "h": np.float64}
    typed_kernel = lp.add_and_infer_dtypes(kernel, input_dtypes)

    reg_count = estimate_regs_per_thread(typed_kernel)
    assert reg_count == 6

コード例 #3

0

ファイルを表示

ファイル: test_perf_model.py プロジェクト: jdsteve2/performance_prediction

def test_reg_counter_specialops():
    """Expect ``estimate_regs_per_thread`` to return 6 for modulo/power ops.

    The kernel (named "specialops") has two instructions: one using ``%`` on
    the float32 arrays ``a`` and ``b``, and one using ``**`` on the float64
    arrays ``g`` and ``h``.
    """
    domain = "{[i,k,j]: 0<=i<n and 0<=k<m and 0<=j<l}"
    # The instruction text is kept verbatim, surrounding whitespace included.
    instructions = [
                """
                c[i, j, k] = (2*a[i,j,k])%(2+b[i,j,k]/3.0)
                e[i, k] = (1+g[i,k])**(1+h[i,k+1])
                """
    ]
    kernel = lp.make_kernel(
        domain, instructions, name="specialops", assumptions="n,m,l >= 1")

    # Declare the dtypes of the four input arrays before estimating registers.
    input_dtypes = {
        "a": np.float32,
        "b": np.float32,
        "g": np.float64,
        "h": np.float64,
    }
    typed_kernel = lp.add_and_infer_dtypes(kernel, input_dtypes)

    reg_count = estimate_regs_per_thread(typed_kernel)
    assert reg_count == 6

コード例 #4

0

ファイルを表示

ファイル: test_perf_model.py プロジェクト: jdsteve2/performance_prediction

def test_reg_counter_basic():
    """Expect ``estimate_regs_per_thread`` to return 6 for basic arithmetic.

    The kernel (named "basic") has two instructions built from ``*``, ``/``
    and ``+``: one on the float32 arrays ``a`` and ``b``, and one on the
    float64 arrays ``g`` and ``h``.
    """
    # Unlike the sibling tests, the domain lists its parameters explicitly.
    domain = "[n,m,l] -> {[i,k,j]: 0<=i<n and 0<=k<m and 0<=j<l}"
    # The instruction text is kept verbatim, surrounding whitespace included.
    instructions = [
                """
                c[i, j, k] = a[i,j,k]*b[i,j,k]/3.0+a[i,j,k]
                e[i, k+1] = g[i,k]*h[i,k+1]
                """
    ]
    kernel = lp.make_kernel(
        domain, instructions, name="basic", assumptions="n,m,l >= 1")

    # Declare the dtypes of the four input arrays before estimating registers.
    input_dtypes = {
        "a": np.float32,
        "b": np.float32,
        "g": np.float64,
        "h": np.float64,
    }
    typed_kernel = lp.add_and_infer_dtypes(kernel, input_dtypes)

    reg_count = estimate_regs_per_thread(typed_kernel)
    assert reg_count == 6

コード例 #5

0

ファイルを表示

ファイル: test_perf_model.py プロジェクト: jdsteve2/performance_prediction

def test_reg_counter_bitwise():
    """Expect ``estimate_regs_per_thread`` to return 6 for bitwise operations.

    The kernel (named "bitwise") has two instructions using ``|``, ``&``,
    ``^``, ``~``, ``<<`` and ``>>``; ``a`` and ``b`` are declared as int32,
    ``g`` and ``h`` as int64.
    """
    domain = "{[i,k,j]: 0<=i<n and 0<=k<m and 0<=j<l}"
    # The instruction text is kept verbatim, surrounding whitespace included.
    instructions = [
                """
                c[i, j, k] = (a[i,j,k] | 1) + (b[i,j,k] & 1)
                e[i, k] = (g[i,k] ^ k)*(~h[i,k+1]) + (g[i, k] << (h[i,k] >> k))
                """
    ]
    kernel = lp.make_kernel(
        domain, instructions, name="bitwise", assumptions="n,m,l >= 1")

    # Declare the dtypes of the four input arrays before estimating registers.
    input_dtypes = {
        "a": np.int32,
        "b": np.int32,
        "g": np.int64,
        "h": np.int64,
    }
    typed_kernel = lp.add_and_infer_dtypes(kernel, input_dtypes)

    reg_count = estimate_regs_per_thread(typed_kernel)
    assert reg_count == 6

コード例 #6

0

ファイルを表示