static int load_maps(struct bpf_map_data *maps, int nr_maps,
                     fixup_map_cb fixup_map)
 {
-       int i;
+       int i, numa_node;
 
        for (i = 0; i < nr_maps; i++) {
                if (fixup_map) {
                        }
                }
 
+               numa_node = maps[i].def.map_flags & BPF_F_NUMA_NODE ?
+                       maps[i].def.numa_node : -1;
+
                if (maps[i].def.type == BPF_MAP_TYPE_ARRAY_OF_MAPS ||
                    maps[i].def.type == BPF_MAP_TYPE_HASH_OF_MAPS) {
                        int inner_map_fd = map_fd[maps[i].def.inner_map_idx];
 
-                       map_fd[i] = bpf_create_map_in_map(maps[i].def.type,
+                       map_fd[i] = bpf_create_map_in_map_node(maps[i].def.type,
                                                        maps[i].def.key_size,
                                                        inner_map_fd,
                                                        maps[i].def.max_entries,
-                                                       maps[i].def.map_flags);
+                                                       maps[i].def.map_flags,
+                                                       numa_node);
                } else {
-                       map_fd[i] = bpf_create_map(maps[i].def.type,
-                                                  maps[i].def.key_size,
-                                                  maps[i].def.value_size,
-                                                  maps[i].def.max_entries,
-                                                  maps[i].def.map_flags);
+                       map_fd[i] = bpf_create_map_node(maps[i].def.type,
+                                                       maps[i].def.key_size,
+                                                       maps[i].def.value_size,
+                                                       maps[i].def.max_entries,
+                                                       maps[i].def.map_flags,
+                                                       numa_node);
                }
                if (map_fd[i] < 0) {
                        printf("failed to create a map: %d %s\n",
 
        unsigned int max_entries;
        unsigned int map_flags;
        unsigned int inner_map_idx;
+       unsigned int numa_node;
 };
 
 struct bpf_map_data {
 
        .key_size = sizeof(u32),
        .value_size = sizeof(long),
        .max_entries = MAX_ENTRIES,
+       .map_flags = BPF_F_NUMA_NODE,
+       .numa_node = 0,
 };
 
 struct bpf_map_def SEC("maps") array_of_lru_hashs = {
 
 
        if (test == INNER_LRU_HASH_PREALLOC) {
                int outer_fd = map_fd[array_of_lru_hashs_idx];
+               unsigned int mycpu, mynode;
 
                assert(cpu < MAX_NR_CPUS);
 
                if (cpu) {
+                       ret = syscall(__NR_getcpu, &mycpu, &mynode, NULL);
+                       assert(!ret);
+
                        inner_lru_map_fds[cpu] =
-                               bpf_create_map(BPF_MAP_TYPE_LRU_HASH,
-                                              sizeof(uint32_t), sizeof(long),
-                                              inner_lru_hash_size, 0);
+                               bpf_create_map_node(BPF_MAP_TYPE_LRU_HASH,
+                                                   sizeof(uint32_t),
+                                                   sizeof(long),
+                                                   inner_lru_hash_size, 0,
+                                                   mynode);
                        if (inner_lru_map_fds[cpu] == -1) {
                                printf("cannot create BPF_MAP_TYPE_LRU_HASH %s(%d)\n",
                                       strerror(errno), errno);
 
 #define BPF_NOEXIST    1 /* create new element if it didn't exist */
 #define BPF_EXIST      2 /* update existing element */
 
+/* flags for BPF_MAP_CREATE command */
 #define BPF_F_NO_PREALLOC      (1U << 0)
 /* Instead of having one common LRU list in the
  * BPF_MAP_TYPE_LRU_[PERCPU_]HASH map, use a percpu LRU list
  * across different LRU lists.
  */
 #define BPF_F_NO_COMMON_LRU    (1U << 1)
+/* Specify numa node during map creation */
+#define BPF_F_NUMA_NODE                (1U << 2)
 
 union bpf_attr {
        struct { /* anonymous struct used by BPF_MAP_CREATE command */
                __u32   key_size;       /* size of key in bytes */
                __u32   value_size;     /* size of value in bytes */
                __u32   max_entries;    /* max number of entries in a map */
-               __u32   map_flags;      /* prealloc or not */
+               __u32   map_flags;      /* BPF_MAP_CREATE related
+                                        * flags defined above.
+                                        */
                __u32   inner_map_fd;   /* fd pointing to the inner map */
+               __u32   numa_node;      /* numa node (effective only if
+                                        * BPF_F_NUMA_NODE is set).
+                                        */
        };
 
        struct { /* anonymous struct used by BPF_MAP_*_ELEM commands */
 
        return syscall(__NR_bpf, cmd, attr, size);
 }
 
-int bpf_create_map(enum bpf_map_type map_type, int key_size,
-                  int value_size, int max_entries, __u32 map_flags)
+int bpf_create_map_node(enum bpf_map_type map_type, int key_size,
+                       int value_size, int max_entries, __u32 map_flags,
+                       int node)
 {
        union bpf_attr attr;
 
        attr.value_size = value_size;
        attr.max_entries = max_entries;
        attr.map_flags = map_flags;
+       if (node >= 0) {
+               attr.map_flags |= BPF_F_NUMA_NODE;
+               attr.numa_node = node;
+       }
 
        return sys_bpf(BPF_MAP_CREATE, &attr, sizeof(attr));
 }
 
-int bpf_create_map_in_map(enum bpf_map_type map_type, int key_size,
-                         int inner_map_fd, int max_entries, __u32 map_flags)
+int bpf_create_map(enum bpf_map_type map_type, int key_size,
+                  int value_size, int max_entries, __u32 map_flags)
+{
+       return bpf_create_map_node(map_type, key_size, value_size,
+                                  max_entries, map_flags, -1);
+}
+
+int bpf_create_map_in_map_node(enum bpf_map_type map_type, int key_size,
+                              int inner_map_fd, int max_entries,
+                              __u32 map_flags, int node)
 {
        union bpf_attr attr;
 
        attr.inner_map_fd = inner_map_fd;
        attr.max_entries = max_entries;
        attr.map_flags = map_flags;
+       if (node >= 0) {
+               attr.map_flags |= BPF_F_NUMA_NODE;
+               attr.numa_node = node;
+       }
 
        return sys_bpf(BPF_MAP_CREATE, &attr, sizeof(attr));
 }
 
+int bpf_create_map_in_map(enum bpf_map_type map_type, int key_size,
+                         int inner_map_fd, int max_entries, __u32 map_flags)
+{
+       return bpf_create_map_in_map_node(map_type, key_size, inner_map_fd,
+                                         max_entries, map_flags, -1);
+}
+
 int bpf_load_program(enum bpf_prog_type type, const struct bpf_insn *insns,
                     size_t insns_cnt, const char *license,
                     __u32 kern_version, char *log_buf, size_t log_buf_sz)
 
 #include <linux/bpf.h>
 #include <stddef.h>
 
+int bpf_create_map_node(enum bpf_map_type map_type, int key_size,
+                       int value_size, int max_entries, __u32 map_flags,
+                       int node);
 int bpf_create_map(enum bpf_map_type map_type, int key_size, int value_size,
                   int max_entries, __u32 map_flags);
+int bpf_create_map_in_map_node(enum bpf_map_type map_type, int key_size,
+                              int inner_map_fd, int max_entries,
+                              __u32 map_flags, int node);
 int bpf_create_map_in_map(enum bpf_map_type map_type, int key_size,
                          int inner_map_fd, int max_entries, __u32 map_flags);
 
 
        unsigned int max_entries;
        unsigned int map_flags;
        unsigned int inner_map_idx;
+       unsigned int numa_node;
 };
 
 static int (*bpf_skb_load_bytes)(void *ctx, int off, void *to, int len) =