Please let me know the proper way to execute the program using Ocelot.
{
ocelot: "ocelot",
trace: {
database: "traces/database.trace",
memoryChecker: {
enabled: false,
checkInitialization: false
},
raceDetector: {
enabled: false,
ignoreIrrelevantWrites: false
},
debugger: {
enabled: false,
kernelFilter: "",
alwaysAttach: true
}
},
cuda: {
implementation: "CudaRuntime",
tracePath: "trace/CudaAPI.trace"
},
executive: {
devices: [emulated],
optimizationLevel: full,
defaultDeviceID: 0,
asynchronousKernelLaunch: True,
port: 2011,
host: "127.0.0.1",
workerThreadLimit: 2,
warpSize: 32
},
optimizations: {
subkernelSize: 10000,
}
}