Exemplo n.º 1
0
  /**
   * Releases the memory chunk described by the given AllocationPoint.
   *
   * <p>The point's current allocation status selects the release path: for HOST the host pointer
   * address is passed to {@code NativeOps.freeHost}, for DEVICE the device pointer address is
   * passed to {@code NativeOps.freeDevice}. The point itself is not modified by this method.
   *
   * @param point allocation point whose memory should be released
   * @throws RuntimeException if the native free call returns 0
   * @throws IllegalStateException if the allocation status is neither HOST nor DEVICE
   */
  @Override
  public void free(AllocationPoint point) {
    switch (point.getAllocationStatus()) {
      case HOST:
        {
          NativeOps nativeOps = NativeOpsHolder.getInstance().getDeviceNativeOps();

          long result = nativeOps.freeHost(point.getPointers().getHostPointer().address());
          // A zero result from the native call is treated as a failed deallocation.
          if (result == 0) {
            throw new RuntimeException("Can't deallocate [HOST] memory...");
          }
          break;
        }
      case DEVICE:
        {
          NativeOps nativeOps = NativeOpsHolder.getInstance().getDeviceNativeOps();

          // NOTE(review): the second argument is passed as a constant 0; its meaning is defined
          // by NativeOps.freeDevice and is not visible from here.
          long result = nativeOps.freeDevice(point.getPointers().getDevicePointer().address(), 0);
          // A zero result from the native call is treated as a failed deallocation.
          if (result == 0) {
            throw new RuntimeException("Can't deallocate [DEVICE] memory...");
          }
          break;
        }
      default:
        throw new IllegalStateException(
            "Can't free memory on target [" + point.getAllocationStatus() + "]");
    }
  }
Exemplo n.º 2
0
  /**
   * Allocates a memory chunk for the given AllocationShape and returns the PointersPair that
   * references it.
   *
   * <p>HOST: memory is obtained through {@code nativeOps.mallocHost}. A new PointersPair is created
   * whose device pointer and host pointer both wrap the same allocated address; the pair is stored
   * on {@code point} and the point's status is set to HOST.
   *
   * <p>DEVICE: memory is obtained through {@code nativeOps.mallocDevice}. The point's existing
   * PointersPair is reused (a new one is created if the point has none), only its device pointer
   * is replaced, and the point's status is set to DEVICE.
   *
   * <p>In both cases a required size below 1 is raised to 1 before the native call.
   *
   * @param shape shape of desired memory chunk
   * @param point target AllocationPoint structure
   * @param location either HOST or DEVICE
   * @return the PointersPair referencing the allocated memory, or {@code null} if a DEVICE
   *     allocation returned a zero address (in that case {@code point} is left unchanged)
   * @throws RuntimeException if a HOST allocation returned a zero address
   * @throws IllegalStateException if {@code location} is neither HOST nor DEVICE
   */
  @Override
  public PointersPair malloc(
      AllocationShape shape, AllocationPoint point, AllocationStatus location) {
    switch (location) {
      case HOST:
        {
          long reqMem = AllocationUtils.getRequiredMemory(shape);

          // FIXME: this is WRONG, and directly leads to memleak
          if (reqMem < 1) {
            reqMem = 1;
          }

          long pointer = nativeOps.mallocHost(reqMem, 0);
          if (pointer == 0) {
            throw new RuntimeException("Can't allocate [HOST] memory: " + reqMem);
          }

          Pointer hostPointer = new CudaPointer(pointer);

          // Both sides of the pair wrap the same host address.
          PointersPair devicePointerInfo = new PointersPair();
          devicePointerInfo.setDevicePointer(new CudaPointer(hostPointer, reqMem));
          devicePointerInfo.setHostPointer(new CudaPointer(hostPointer, reqMem));

          point.setPointers(devicePointerInfo);
          point.setAllocationStatus(AllocationStatus.HOST);
          return devicePointerInfo;
        }
      case DEVICE:
        {
          long reqMem = AllocationUtils.getRequiredMemory(shape);

          // FIXME: this is WRONG, and directly leads to memleak
          if (reqMem < 1) {
            reqMem = 1;
          }

          long pointer = nativeOps.mallocDevice(reqMem, 0, 0);
          // Unlike the HOST branch, a failed device allocation is reported with null, not an
          // exception, and the point is not touched.
          if (pointer == 0) {
            return null;
          }

          Pointer devicePointer = new CudaPointer(pointer);

          // Reuse the point's pair so that an already-set host pointer is kept.
          // NOTE(review): when the point has no pair yet, the freshly created one is only
          // returned and not stored on the point (the HOST branch does store it) - confirm that
          // callers attach it themselves.
          PointersPair devicePointerInfo = point.getPointers();
          if (devicePointerInfo == null) {
            devicePointerInfo = new PointersPair();
          }
          devicePointerInfo.setDevicePointer(new CudaPointer(devicePointer, reqMem));

          point.setAllocationStatus(AllocationStatus.DEVICE);

          return devicePointerInfo;
        }
      default:
        throw new IllegalStateException("Unsupported location for malloc: [" + location + "]");
    }
  }