reference, declarationdefinition
definition → references, declarations, derived classes, virtual overrides
reference to multiple definitions → definitions
unreferenced
    1
    2
    3
    4
    5
    6
    7
    8
    9
   10
   11
   12
   13
   14
   15
   16
   17
   18
   19
   20
   21
   22
   23
   24
   25
   26
   27
   28
   29
   30
   31
   32
   33
   34
   35
   36
   37
   38
   39
   40
   41
   42
   43
   44
   45
   46
   47
   48
   49
   50
   51
   52
   53
   54
   55
   56
   57
   58
   59
   60
   61
   62
   63
   64
   65
   66
   67
   68
   69
   70
   71
   72
   73
   74
   75
   76
   77
   78
   79
   80
   81
   82
   83
   84
   85
   86
// RUN: %libomptarget-compile-run-and-check-aarch64-unknown-linux-gnu
// RUN: %libomptarget-compile-run-and-check-powerpc64-ibm-linux-gnu
// RUN: %libomptarget-compile-run-and-check-powerpc64le-ibm-linux-gnu
// RUN: %libomptarget-compile-run-and-check-x86_64-pc-linux-gnu

#include <omp.h>
#include <stdio.h>

// ---------------------------------------------------------------------------
// Various definitions copied from OpenMP RTL

extern void __tgt_register_requires(int64_t);

extern void __tgt_target_data_begin(int64_t device_id, int32_t arg_num,
                                    void **args_base, void **args,
                                    int64_t *arg_sizes, int64_t *arg_types);

extern void __tgt_target_data_end(int64_t device_id, int32_t arg_num,
                                  void **args_base, void **args,
                                  int64_t *arg_sizes, int64_t *arg_types);

// End of definitions copied from OpenMP RTL.
// ---------------------------------------------------------------------------

#pragma omp requires unified_shared_memory

#define N 1024

int main(int argc, char *argv[]) {
  int fails;
  void *host_alloc = 0, *device_alloc = 0;
  int *a = (int *)malloc(N * sizeof(int));

  // Manual registration of requires flags for Clang versions
  // that do not support requires.
  __tgt_register_requires(8);

  // Init
  for (int i = 0; i < N; ++i) {
    a[i] = 10;
  }
  host_alloc = &a[0];

// Dummy target region that ensures the runtime library is loaded when
// the target data begin/end functions are manually called below.
#pragma omp target
  {}

  // Manual calls
  int device_id = omp_get_default_device();
  int arg_num = 1;
  void **args_base = (void **)&a;
  void **args = (void **)&a;
  int64_t arg_sizes[arg_num];

  arg_sizes[0] = sizeof(int) * N;

  int64_t arg_types[arg_num];

  // Ox400 enables the CLOSE map type in the runtime:
  // OMP_TGT_MAPTYPE_CLOSE = 0x400
  // OMP_TGT_MAPTYPE_TO    = 0x001
  arg_types[0] = 0x400 | 0x001;

  device_alloc = host_alloc;

  __tgt_target_data_begin(device_id, arg_num, args_base, args, arg_sizes,
                          arg_types);

#pragma omp target data use_device_ptr(a)
  { device_alloc = a; }

  __tgt_target_data_end(device_id, arg_num, args_base, args, arg_sizes,
                        arg_types);

  // CHECK: a was copied to the device
  if (device_alloc != host_alloc)
    printf("a was copied to the device\n");

  free(a);

  // CHECK: Done!
  printf("Done!\n");

  return 0;
}