Changeset 3117 in CLRX


Ignore:
Timestamp:
Jun 1, 2017, 6:42:23 PM (19 months ago)
Author:
matszpk
Message:

CLRadeonExtender: AmdCL2Bin: Fix the TIDIG_COMP_CNT value in PgmRSRC2 for GFX9 (AMD Vega architecture).

File:
1 edited

Legend:

Unmodified
Added
Removed
  • CLRadeonExtender/trunk/amdbin/AmdCL2BinGen.cpp

    r3056 r3117  
    11151115
    11161116static uint32_t calculatePgmRSRC2(const AmdCL2KernelConfig& config,
    1117                   bool storeLocalSize = false)
     1117                GPUArchitecture arch, bool storeLocalSize = false)
    11181118{
    11191119    uint32_t dimValues = 0;
     
    11211121    {
    11221122        dimValues = ((config.dimMask&7)<<7);
    1123         if (!config.useEnqueue)
     1123        if (!config.useEnqueue || arch==GPUArchitecture::GCN1_4)
     1124            // useenqueue in GFX9 is enabled by default ???
    11241125            dimValues |= (((config.dimMask&4) ? 2 : (config.dimMask&2) ? 1 : 0)<<11);
    11251126        else // enqueue needs TIDIG_COMP_CNT=2 ????
     
    11751176        setup1 = 0x9;
    11761177   
    1177     SLEV(setupData.pgmRSRC2, calculatePgmRSRC2(config));
     1178    SLEV(setupData.pgmRSRC2, calculatePgmRSRC2(config, arch));
    11781179   
    11791180    SLEV(setupData.setup1, setup1);
     
    15091510    }
    15101511    fob.fill(0xa8-sizeof(IntAmdCL2StubEnd), 0);
    1511     fob.writeObject(LEV(calculatePgmRSRC2(config, true)));
     1512    fob.writeObject(LEV(calculatePgmRSRC2(config, arch, true)));
    15121513    fob.fill(0xc0-0xac, 0);
    15131514}
Note: See TracChangeset for help on using the changeset viewer.