Revision 202
Splutter/GPU/SplutterGPU.py (revision 202)
@@ -384,6 +384,7 @@
 
 for i in range(steps):
 
+start_time=time.time()
 Splutter[:]=0
 
 print Splutter,len(Splutter)
@@ -427,7 +428,8 @@
 stop.record()
 stop.synchronize()
 
-elapsed = start.time_till(stop)*1e-3
+# elapsed = start.time_till(stop)*1e-3
+elapsed = time.time()-start_time
 
 print Splutter,sum(Splutter)
 MySplutter[i]=numpy.median(Splutter)
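This revision swaps the CUDA event timer for a host-side wall clock: `start_time` is read with `time.time()` at the top of the loop body (new line 387) and the event-based measurement is kept only as a comment. A minimal sketch of the two approaches, assuming PyCUDA and an available CUDA device; the kernel launch is a placeholder:

```python
import time
import pycuda.driver as cuda
import pycuda.autoinit  # creates a context on the first available device

# r201 style: CUDA events measure elapsed time on the device side
start, stop = cuda.Event(), cuda.Event()
start.record()
# ... kernel launch would go here ...
stop.record()
stop.synchronize()
elapsed_event = start.time_till(stop) * 1e-3  # time_till() returns milliseconds

# r202 style: wall clock around the same region
start_time = time.time()
# ... kernel launch would go here ...
elapsed_wall = time.time() - start_time
```

Event timing isolates the kernel itself; the wall-clock figure also counts the Python overhead around the launch.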
@@ -459,22 +461,17 @@
 # Default Device selection based on ALU Type
 for platform in cl.get_platforms():
 for device in platform.get_devices():
-deviceType=cl.device_type.to_string(device.type)
+#deviceType=cl.device_type.to_string(device.type)
 deviceMemory=device.max_mem_alloc_size
 if deviceMemory>MaxMemoryXPU:
 MaxMemoryXPU=deviceMemory
 if deviceMemory<MinMemoryXPU or MinMemoryXPU==0:
 MinMemoryXPU=deviceMemory
-if deviceType=="GPU" and Alu=="GPU" and not HasXPU:
+if not HasXPU:
 XPU=device
-print "GPU selected with Allocable Memory %i: %s" % (deviceMemory,device.name)
+print "XPU selected with Allocable Memory %i: %s" % (deviceMemory,device.name)
 HasXPU=True
 MemoryXPU=deviceMemory
-if deviceType=="CPU" and Alu=="CPU" and not HasXPU:
-XPU=device
-print "CPU selected with Allocable Memory %i: %s" % (deviceMemory,device.name)
-HasXPU=True
-MemoryXPU=deviceMemory
 
 else:
 print "Enter XPU selector based on device number & ALU type"
@@ -483,13 +480,13 @@
 # Primary Device selection based on Device Id
 for platform in cl.get_platforms():
 for device in platform.get_devices():
-deviceType=cl.device_type.to_string(device.type)
+#deviceType=cl.device_type.to_string(device.type)
 deviceMemory=device.max_mem_alloc_size
 if deviceMemory>MaxMemoryXPU:
 MaxMemoryXPU=deviceMemory
 if deviceMemory<MinMemoryXPU or MinMemoryXPU==0:
 MinMemoryXPU=deviceMemory
-if Id==Device and Alu==deviceType and HasXPU==False:
+if Id==Device and HasXPU==False:
 XPU=device
 print "CPU/GPU selected with Allocable Memory %i: %s" % (deviceMemory,device.name)
 HasXPU=True
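The explicit selection likewise keeps only the device-number test: the requested `Device` id now matches regardless of whether the device type agrees with `Alu`. For reference, a small sketch of how that 1-based id is counted across all platforms (a hypothetical helper, not the file's code):

```python
import pyopencl as cl

def select_device_by_id(Device):
    """Return the Device-th OpenCL device (1-based), counted across every platform."""
    Id = 1
    for platform in cl.get_platforms():
        for device in platform.get_devices():
            if Id == Device:
                return device
            Id = Id + 1
    return None
```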
@@ -540,8 +537,11 @@
 
 print Splutter,len(Splutter)
 
+h2d_time=time.time()
 SplutterCL = cl.Buffer(ctx, mf.WRITE_ONLY|mf.COPY_HOST_PTR,hostbuf=Splutter)
+print('From Host to Device time %f' % (time.time()-h2d_time))
 
+start_time=time.time()
 if ParaStyle=='Blocks':
 # Call OpenCL kernel
 # (1,) is Global work size (only 1 work size)
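r202 brackets the buffer creation with `time.time()` to report the host-to-device transfer, and restarts `start_time` just before the kernel section. A minimal sketch, assuming a PyOpenCL context and a stand-in numpy array (the real `Splutter` array is defined elsewhere in the file):

```python
import time
import numpy
import pyopencl as cl

ctx = cl.create_some_context()
mf = cl.mem_flags

Splutter = numpy.zeros(1024).astype(numpy.float32)  # stand-in for the real array

# With COPY_HOST_PTR the runtime may defer the actual transfer, so this
# wall-clock figure is indicative rather than a strict H2D bandwidth measure.
h2d_time = time.time()
SplutterCL = cl.Buffer(ctx, mf.WRITE_ONLY | mf.COPY_HOST_PTR, hostbuf=Splutter)
print('From Host to Device time %f' % (time.time() - h2d_time))
```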
@@ -592,12 +592,16 @@
 print "%s with %i %s done" % (Alu,jobs,ParaStyle)
 
 CLLaunch.wait()
+d2h_time=time.time()
 cl.enqueue_copy(queue, Splutter, SplutterCL).wait()
+print('From Device to Host %f' % (time.time()-d2h_time))
+
+# elapsed = 1e-9*(CLLaunch.profile.end - CLLaunch.profile.start)
+elapsed = time.time()-start_time
+print('Elapsed compute time %f' % elapsed)
 
-elapsed = 1e-9*(CLLaunch.profile.end - CLLaunch.profile.start)
-
 MyDuration[i]=elapsed
-print Splutter,sum(Splutter)
+#print Splutter,sum(Splutter)
 #MySplutter[i]=numpy.median(Splutter)
 #print numpy.mean(Splutter)*len(Splutter),MySplutter[i]*len(Splutter),numpy.std(Splutter)
 
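Here the compute time switches from the OpenCL event profile (`CLLaunch.profile.end - CLLaunch.profile.start`, in nanoseconds, kept as a comment) to a wall clock that also covers the copy back to the host, and the per-iteration dump of `Splutter` is commented out. A self-contained sketch contrasting the two measurements; the kernel, buffer and sizes are illustrative, not the file's:

```python
import time
import numpy
import pyopencl as cl

ctx = cl.create_some_context()
# PROFILING_ENABLE is needed to read event.profile.* afterwards
queue = cl.CommandQueue(ctx,
                        properties=cl.command_queue_properties.PROFILING_ENABLE)
mf = cl.mem_flags

a = numpy.zeros(1 << 20, dtype=numpy.float32)
a_cl = cl.Buffer(ctx, mf.READ_WRITE | mf.COPY_HOST_PTR, hostbuf=a)

prg = cl.Program(ctx, """
__kernel void inc(__global float *a) { a[get_global_id(0)] += 1.0f; }
""").build()

start_time = time.time()
CLLaunch = prg.inc(queue, a.shape, None, a_cl)  # the launch returns an event
CLLaunch.wait()
cl.enqueue_copy(queue, a, a_cl).wait()
wall = time.time() - start_time                 # r202: kernel + copy + Python overhead

gpu = 1e-9 * (CLLaunch.profile.end - CLLaunch.profile.start)  # r201: kernel only
print('Elapsed compute time %f (wall) vs %f (event profile)' % (wall, gpu))
```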
@@ -731,9 +735,9 @@
 Id=1
 for platform in cl.get_platforms():
 for device in platform.get_devices():
-deviceType=cl.device_type.to_string(device.type)
+#deviceType=cl.device_type.to_string(device.type)
 deviceMemory=device.max_mem_alloc_size
-print "Device #%i from %s of type %s with memory %i : %s" % (Id,platform.vendor,deviceType,deviceMemory,device.name.lstrip())
+print "Device #%i from %s with memory %i : %s" % (Id,platform.vendor,deviceMemory,device.name.lstrip())
 Id=Id+1
 
 
@@ -805,11 +809,11 @@
 Id=1
 for platform in cl.get_platforms():
 for device in platform.get_devices():
-deviceType=cl.device_type.to_string(device.type)
-print "Device #%i of type %s : %s" % (Id,deviceType,device.name)
+#deviceType=cl.device_type.to_string(device.type)
+print "Device #%i : %s" % (Id,device.name)
 if Id == Device:
 # Set the Alu as detected Device Type
-Alu=deviceType
+Alu='xPU'
 Id=Id+1
 except ImportError:
 print "Platform does not seem to support CUDA"
Formats disponibles : Unified diff