GPU Calc: reflect the true cost of InterpretTail more accurately.
Change-Id: I7004150569e5329f19d2f08adbd70477bd6252ff
This commit is contained in:
@@ -376,9 +376,17 @@ ds_status evaluateScoreForDevice(ds_device* device, void* evalData)
|
|||||||
testData->output[j] = fAverage + (fMin * fSoP);
|
testData->output[j] = fAverage + (fMin * fSoP);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// InterpretTail - the S/W fallback is nowhere near as efficient
|
||||||
|
// as any good OpenCL implementation: no SIMD, tons of branching
|
||||||
|
// in the inner loops etc. Generously characterise it as only 10x
|
||||||
|
// slower than the above.
|
||||||
|
float fInterpretTailFactor = 10.0;
|
||||||
|
|
||||||
device->score = (void*)new LibreOfficeDeviceScore;
|
device->score = (void*)new LibreOfficeDeviceScore;
|
||||||
((LibreOfficeDeviceScore*)device->score)->fTime = timerCurrent(&kernelTime);
|
((LibreOfficeDeviceScore*)device->score)->fTime = timerCurrent(&kernelTime);
|
||||||
((LibreOfficeDeviceScore*)device->score)->bNoCLErrors = true;
|
((LibreOfficeDeviceScore*)device->score)->bNoCLErrors = true;
|
||||||
|
|
||||||
|
((LibreOfficeDeviceScore*)device->score)->fTime *= fInterpretTailFactor;
|
||||||
}
|
}
|
||||||
return DS_SUCCESS;
|
return DS_SUCCESS;
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user