// Metal definitions
#define NS_PRIVATE_IMPLEMENTATION
#define CA_PRIVATE_IMPLEMENTATION
#define MTL_PRIVATE_IMPLEMENTATION

// NOTE(review): the header names on these #include lines were missing from the
// file; the list below is reconstructed from the symbols the code uses
// (NS::, MTL::, std::chrono, printf) - confirm against the original build.
#include <Foundation/Foundation.hpp>
#include <Metal/Metal.hpp>

#include <chrono>
#include <cstdio>

/// Minimal stopwatch that reports elapsed wall-clock time in milliseconds.
///
/// Call begin() to mark the start of an interval, then end() to print how much
/// time has passed since that mark. One Timer can be reused for any number of
/// begin()/end() pairs; end() does not reset the mark.
class Timer
{
    private:
        // steady_clock is monotonic, which is what interval measurement needs:
        // an adjustment of the system clock cannot produce a negative or
        // inflated duration.
        using Clock = std::chrono::steady_clock;

        // Defaults to the construction time so that end() still prints a
        // sensible value if begin() was never called.
        Clock::time_point start_time = Clock::now();
    public:
        Timer() {}

        /// Marks "now" as the start of the interval being measured.
        void begin() {start_time = Clock::now();}

        /// Returns the time elapsed since the last begin() (or since
        /// construction), in milliseconds, without printing anything.
        double elapsed_ms() const
        {
            // The explicit <double, std::milli> is essential: letting the type
            // be deduced yields the clock's native integer tick count, which is
            // neither a double (as "%.6f" requires) nor in milliseconds.
            const std::chrono::duration<double, std::milli> elapsed = Clock::now() - start_time;
            return elapsed.count();
        }

        /// Prints "<str><elapsed> ms" followed by a newline to stdout.
        ///
        /// @param str Label printed in front of the elapsed time.
        void end(const char * str = "Duration: ")
        {
            printf("%s%.6f ms\n", str, elapsed_ms());
        }
};

int main()
{
    Timer t,tt;
    
    NS::Error* error;
    auto gpuHandler = MTL::CreateSystemDefaultDevice();
    auto commandQueue = gpuHandler-&gt;newCommandQueue();
    auto gpuFunctionsLibrary = gpuHandler-&gt;newLibrary(NS::String::string(&#34;kernel void dummyKernel(){}&#34;, NS::ASCIIStringEncoding), nullptr, &amp;error);
    auto functionName = NS::String::string(&#34;dummyKernel&#34;, NS::ASCIIStringEncoding);
    auto gpuFunction = gpuFunctionsLibrary-&gt;newFunction(functionName);
    auto computePipelineState = gpuHandler-&gt;newComputePipelineState(gpuFunction, &amp;error);
    auto gridSize = MTL::Size::Make(1,1,1);
    auto groupSize = MTL::Size::Make(32,1,1);

    tt.begin();
    for(int k = 0; k &lt; 100; k += 1)
    {
        t.begin();
        auto commandBuffer = commandQueue-&gt;commandBuffer();
        auto commandEncoder = commandBuffer-&gt;computeCommandEncoder();
        commandEncoder-&gt;setComputePipelineState(computePipelineState);
        commandEncoder-&gt;dispatchThreadgroups(gridSize, groupSize);
        commandEncoder-&gt;endEncoding();
        t.end(&#34;Encoding: &#34;);
        
        t.begin();
        commandBuffer-&gt;commit();
        t.end(&#34;Commit:   &#34;);
        
        t.begin();
        commandBuffer-&gt;waitUntilCompleted();
        t.end(&#34;Wait:     &#34;);
        
        double gpuTimeSec = commandBuffer-&gt;GPUEndTime() - commandBuffer-&gt;GPUStartTime();
        printf(&#34;GPU:      %.6f ms\n&#34;, gpuTimeSec * 1000);
        
        printf(&#34;---\n&#34;);
        
        //commandBuffer-&gt;release();
        //commandEncoder-&gt;release();
    }
    tt.end(&#34;Total: &#34;);
}