-
Notifications
You must be signed in to change notification settings - Fork 884
[Draft] GPA Protection Implementation #35
base: master
Are you sure you want to change the base?
Changes from 1 commit
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -33,6 +33,7 @@ | |
#include "../include/hax.h" | ||
#include "include/paging.h" | ||
#include "../include/hax_host_mem.h" | ||
#include "ept2.h" | ||
|
||
int gpa_space_init(hax_gpa_space *gpa_space) | ||
{ | ||
|
@@ -59,6 +60,13 @@ int gpa_space_init(hax_gpa_space *gpa_space) | |
return ret; | ||
} | ||
|
||
/*
 * Returns the allocation size, in bytes, of a protection bitmap covering
 * |npages| guest page frames (one bit per page).
 */
static uint64 gpa_space_prot_bitmap_size(uint64 npages)
{
    /* One bit per page, rounded up to a whole byte */
    uint64 nbytes = (npages + 7) / 8;

    /* Extra 8 bytes of slack — presumably so the bit helpers, which cast
     * the byte array to uint64 *, can safely touch the trailing word.
     * TODO(review): confirm this is the intent of the padding. */
    return nbytes + 8;
}
|
||
void gpa_space_free(hax_gpa_space *gpa_space) | ||
{ | ||
hax_gpa_space_listener *listener, *tmp; | ||
|
@@ -75,6 +83,9 @@ void gpa_space_free(hax_gpa_space *gpa_space) | |
hax_gpa_space_listener, entry) { | ||
hax_list_del(&listener->entry); | ||
} | ||
if (gpa_space->prot_bitmap.bitmap) | ||
hax_vfree(gpa_space->prot_bitmap.bitmap, | ||
gpa_space_prot_bitmap_size(gpa_space->prot_bitmap.max_gpfn)); | ||
} | ||
|
||
void gpa_space_add_listener(hax_gpa_space *gpa_space, | ||
|
@@ -346,3 +357,118 @@ uint64 gpa_space_get_pfn(hax_gpa_space *gpa_space, uint64 gfn, uint8 *flags) | |
|
||
return pfn; | ||
} | ||
|
||
/*
 * Grows the GPA protection bitmap so it can track page frames up to
 * |max_gpfn|. The bitmap only ever grows; it is freed when the GPA space
 * is destroyed (gpa_space_free()).
 * Returns 0 on success (including when no growth is needed), or -ENOMEM
 * if the new bitmap cannot be allocated.
 */
int gpa_space_adjust_prot_bitmap(hax_gpa_space *gpa_space, uint64 max_gpfn)
{
    prot_bitmap *pb = &gpa_space->prot_bitmap;
    uint8 *bmold = pb->bitmap, *bmnew = NULL;

    /* Bitmap size only grows until it is destroyed */
    if (max_gpfn <= pb->max_gpfn)
        return 0;

    bmnew = hax_vmalloc(gpa_space_prot_bitmap_size(max_gpfn), HAX_MEM_NONPAGE);
    if (!bmnew) {
        hax_error("%s: Not enough memory for new protection bitmap\n",
                  __func__);
        return -ENOMEM;
    }
    /* Start with all pages unprotected: the portion beyond the old bitmap
     * must not contain stale bits in case hax_vmalloc() does not return
     * zeroed memory. */
    memset(bmnew, 0, gpa_space_prot_bitmap_size(max_gpfn));
    pb->bitmap = bmnew;
    if (bmold) {
        /* Preserve the protection state recorded so far */
        memcpy(bmnew, bmold, gpa_space_prot_bitmap_size(pb->max_gpfn));
        hax_vfree(bmold, gpa_space_prot_bitmap_size(pb->max_gpfn));
    }
    pb->max_gpfn = max_gpfn;
    return 0;
}
|
||
static void gpa_space_set_prot_bitmap(uint64 start, uint64 nbits, | ||
uint8 *bitmap, bool set) | ||
{ | ||
uint64 i = 0; | ||
uint64 start_index = start / 8; | ||
uint64 start_bit = start % 8; | ||
uint64 end_index = (start + nbits) / 8; | ||
uint64 end_bit = (start + nbits) % 8; | ||
|
||
if (start_index == end_index) { | ||
for (i = start; i < start + nbits; i++) | ||
if (set) | ||
hax_test_and_set_bit(i, (uint64 *)bitmap); | ||
else | ||
hax_test_and_clear_bit(i, (uint64 *)bitmap); | ||
return; | ||
} | ||
|
||
for (i = start; i < (start_index + 1) * 8; i++) | ||
if (set) | ||
hax_test_and_set_bit(i, (uint64 *)bitmap); | ||
else | ||
hax_test_and_clear_bit(i, (uint64 *)bitmap); | ||
|
||
for (i = end_index * 8; i < start + nbits; i++) | ||
if (set) | ||
hax_test_and_set_bit(i, (uint64 *)bitmap); | ||
else | ||
hax_test_and_clear_bit(i, (uint64 *)bitmap); | ||
|
||
for (i = start_index + 1; i < end_index; i++) | ||
if (set) | ||
bitmap[i] = 0xFF; | ||
else | ||
bitmap[i] = 0; | ||
} | ||
|
||
/*
 * Returns non-zero if guest page frame |gfn| is marked protected in the
 * GPA protection bitmap, or 0 otherwise — including when no bitmap has
 * been allocated yet or |gfn| is beyond the bitmap's range.
 */
int gpa_space_test_prot_bitmap(struct hax_gpa_space *gpa_space, uint64 gfn)
{
    struct prot_bitmap *pbm = &gpa_space->prot_bitmap;

    /* |pbm| is the address of an embedded member and can never be NULL;
     * the meaningful guard is whether the bitmap has been allocated. */
    if (!pbm->bitmap)
        return 0;

    if (gfn >= pbm->max_gpfn)
        return 0;

    return hax_test_bit(gfn, (uint64 *)pbm->bitmap);
}
|
||
/*
 * Checks whether any page in the 2MB chunk containing |gfn| is protected.
 * On a hit, stores the first protected gfn of that chunk in |*fault_gfn|
 * and returns 1; returns 0 if the whole chunk is unprotected.
 */
int gpa_space_chunk_protected(struct hax_gpa_space *gpa_space, uint64 gfn,
                              uint64 *fault_gfn)
{
    /* Round down to the first page frame of the enclosing chunk.
     * (Renamed from |__gfn|: identifiers beginning with a double
     * underscore are reserved by the C standard.) */
    uint64 chunk_start = gfn / HAX_CHUNK_NR_PAGES * HAX_CHUNK_NR_PAGES;

    for (gfn = chunk_start; gfn < chunk_start + HAX_CHUNK_NR_PAGES; gfn++) {
        if (gpa_space_test_prot_bitmap(gpa_space, gfn)) {
            *fault_gfn = gfn;
            return 1;
        }
    }

    return 0;
}
|
||
/*
 * Updates GPA protection for the range [start_gpa, start_gpa + len).
 * |flags| carries the permissions to allow: 0 means no access at all (the
 * range becomes protected, and its EPT entries are invalidated so the next
 * guest access faults), while HAX_GPA_PROT_ALL restores full access.
 * Partial r/w/e combinations are not supported yet.
 * Returns 0 on success, -EINVAL on bad arguments, or -ENOMEM if the
 * protection bitmap cannot be grown to cover the range.
 */
int gpa_space_protect_range(struct hax_gpa_space *gpa_space,
                            struct hax_ept_tree *ept_tree,
                            uint64 start_gpa, uint64 len, int8 flags)
{
    uint64 gfn;
    uint64 npages;  /* uint64, not uint: avoid truncating huge ranges */
    int ret;

    if (len == 0) {
        hax_error("%s: len = 0\n", __func__);
        return -EINVAL;
    }

    /* Specific r/w/e protection combinations are not supported yet */
    if (flags != 0 && (flags & HAX_GPA_PROT_MASK) != HAX_GPA_PROT_ALL)
        return -EINVAL;

    gfn = start_gpa >> PG_ORDER_4K;
    npages = (len + PAGE_SIZE_4K - 1) >> PG_ORDER_4K;

    /* Make sure the bitmap covers the whole range before touching its
     * bits; gpa_space_set_prot_bitmap() does no bounds checking. */
    ret = gpa_space_adjust_prot_bitmap(gpa_space, gfn + npages);
    if (ret != 0)
        return ret;

    /* flags == 0 (no permissions) means "protect": set the bits */
    gpa_space_set_prot_bitmap(gfn, npages, gpa_space->prot_bitmap.bitmap,
                              !flags);

    if (!flags)
        ept_tree_invalidate_entries(ept_tree, gfn, npages);

    return 0;
}
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -59,6 +59,7 @@ int hax_vm_set_ram2(struct vm_t *vm, struct hax_set_ram_info2 *info); | |
int hax_vm_free_all_ram(struct vm_t *vm); | ||
int in_pmem_range(struct hax_vcpu_mem *pmem, uint64_t va); | ||
int hax_vm_add_ramblock(struct vm_t *vm, uint64_t start_uva, uint64_t size); | ||
int hax_vm_gpa_prot(struct vm_t *vm, struct hax_gpa_prot_info *info); | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. How about |
||
|
||
void * get_vm_host(struct vm_t *vm); | ||
int set_vm_host(struct vm_t *vm, void *vm_host); | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -36,6 +36,7 @@ | |
|
||
#define HAX_CHUNK_SHIFT 21 | ||
#define HAX_CHUNK_SIZE (1U << HAX_CHUNK_SHIFT) // 2MB | ||
#define HAX_CHUNK_NR_PAGES (HAX_CHUNK_SIZE/PAGE_SIZE_4K) | ||
|
||
typedef struct hax_chunk { | ||
hax_memdesc_user memdesc; | ||
|
@@ -80,12 +81,20 @@ typedef struct hax_memslot { | |
// Used only by memslot_set_mapping(), not by any hax_memslot | ||
#define HAX_MEMSLOT_INVALID 0x80 | ||
|
||
typedef struct prot_bitmap { | ||
// R/W/E Protection Bitmap | ||
uint8 *bitmap; | ||
// Last gpfn | ||
uint64 max_gpfn; | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. How about There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. You are correct. The max only means "max known so far". End is better. |
||
} prot_bitmap; | ||
|
||
typedef struct hax_gpa_space { | ||
// TODO: Add a lock to prevent concurrent accesses to |ramblock_list| and | ||
// |memslot_list| | ||
hax_list_head ramblock_list; | ||
hax_list_head memslot_list; | ||
hax_list_head listener_list; | ||
prot_bitmap prot_bitmap; | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Maybe rename the field to |
||
} hax_gpa_space; | ||
|
||
typedef struct hax_gpa_space_listener hax_gpa_space_listener; | ||
|
@@ -298,6 +307,21 @@ void gpa_space_unmap_page(hax_gpa_space *gpa_space, hax_kmap_user *kmap); | |
// MMIO. | ||
uint64 gpa_space_get_pfn(hax_gpa_space *gpa_space, uint64 gfn, uint8 *flags); | ||
|
||
int gpa_space_protect_range(struct hax_gpa_space *gpa_space, | ||
struct hax_ept_tree *ept_tree, | ||
uint64 start_gpa, uint64 len, int8 flags); | ||
|
||
// Adjust gpa protection bitmap size. Once a bigger gfn is met, allocate | ||
// a new bitmap and copy the old bitmap contents. | ||
// |gpa_space|: The GPA space of the guest. | ||
// |max_gpfn|: max gfn that the bitmap can hold. | ||
int gpa_space_adjust_prot_bitmap(struct hax_gpa_space *gpa_space, | ||
uint64 max_gpfn); | ||
|
||
int gpa_space_test_prot_bitmap(struct hax_gpa_space *gpa_space, uint64 gfn); | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Nice! |
||
int gpa_space_chunk_protected(struct hax_gpa_space *gpa_space, uint64 gfn, | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Return type: |
||
uint64 *fault_gfn); | ||
|
||
// Allocates a |hax_chunk| for the given UVA range, and pins the corresponding | ||
// host page frames in RAM. | ||
// |base_uva|: The start of the UVA range. Should be page-aligned. | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -109,7 +109,8 @@ enum exit_status { | |
HAX_EXIT_HLT, | ||
HAX_EXIT_STATECHANGE, | ||
HAX_EXIT_PAUSED, | ||
HAX_EXIT_FAST_MMIO | ||
HAX_EXIT_FAST_MMIO, | ||
HAX_EXIT_GPAPROT | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. How about There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Sounds good! |
||
}; | ||
|
||
enum run_flag { | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -128,6 +128,11 @@ struct hax_tunnel { | |
struct { | ||
paddr_t gla; | ||
} mmio; | ||
struct { | ||
paddr_t gpa; | ||
uint8_t access; | ||
uint8_t pad[7]; | ||
} gpaprot; | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. How about |
||
struct { | ||
paddr_t dummy; | ||
} state; | ||
|
@@ -169,6 +174,7 @@ struct hax_module_version { | |
#define HAX_CAP_64BIT_RAMBLOCK (1 << 3) | ||
#define HAX_CAP_64BIT_SETRAM (1 << 4) | ||
#define HAX_CAP_TUNNEL_PAGE (1 << 5) | ||
#define HAX_CAP_GPA_PROTECTION (1 << 6) | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. How about There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. OK. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. We could actually return both the GPA and HVA to QEMU at every |
||
|
||
struct hax_capabilityinfo { | ||
/* | ||
|
@@ -236,6 +242,14 @@ struct hax_set_ram_info2 { | |
uint64_t reserved2; | ||
} PACKED; | ||
|
||
#define HAX_GPA_PROT_MASK 0x7 // one bit each for r/w/e | ||
#define HAX_GPA_PROT_ALL 0x7 // disable r/w/e all | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I was confused at first whether "disable all" means to disallow or allow all accesses. So how about
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Agree. |
||
struct hax_gpa_prot_info { | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. OK. |
||
uint64_t pa_start; | ||
uint64_t size; | ||
uint64_t flags; | ||
} PACKED; | ||
|
||
/* This interface is support only after API version 2 */ | ||
struct hax_qemu_version { | ||
/* Current API version in QEMU*/ | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -116,10 +116,10 @@ static inline void hax_mutex_free(hax_mutex lock) | |
} | ||
|
||
/* Return true if the bit is set already */ | ||
static int hax_test_and_set_bit(int bit, uint64_t *memory) | ||
static int hax_test_and_set_bit(uint64 bit, uint64_t *memory) | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I have concerns about this change. Is it safe to use a 64-bit integer as an array index ( There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Removed. |
||
{ | ||
long *base = (long *)memory; | ||
long nr_long; | ||
uint64 nr_long; | ||
long bitoffset_in_long; | ||
long bits_per_long = sizeof(long) * 8; | ||
|
||
|
@@ -139,10 +139,10 @@ static int hax_test_and_set_bit(int bit, uint64_t *memory) | |
* Return true if the bit is cleared already | ||
* Notice that InterlockedBitTestAndReset return original value in that bit | ||
*/ | ||
static int hax_test_and_clear_bit(int bit, uint64_t *memory) | ||
static int hax_test_and_clear_bit(uint64 bit, uint64_t *memory) | ||
{ | ||
long * base = (long *)memory; | ||
long nr_long; | ||
uint64 nr_long; | ||
long bitoffset_in_long; | ||
long bits_per_long = sizeof(long) * 8; | ||
|
||
|
@@ -159,9 +159,9 @@ static int hax_test_and_clear_bit(int bit, uint64_t *memory) | |
} | ||
|
||
/* Don't care for the big endian situation */ | ||
static bool hax_test_bit(int bit, uint64_t *memory) | ||
static bool hax_test_bit(uint64 bit, uint64_t *memory) | ||
{ | ||
int byte = bit / 8; | ||
uint64 byte = bit / 8; | ||
unsigned char *p; | ||
int offset = bit % 8; | ||
|
||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
So this is the intrusive change you were talking about :) It didn't look very intrusive to me until I peeked at the second patch. I need to spend more time tomorrow to understand the rationale better and think about possible alternatives. But maybe I can ask you this for now: if we don't have to worry about chunks (see my other long comment below), do we still need this extra parameter?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Ah, yes.
I also think about something like:
__try {
hax_vcpu_run();
--------> call RaiseException when we failed to pass protection check
} __except (xxxx) {
//fill related htun and exit
}
But I have two concerns, and I do not know the answers:
1> It seems too Windows-specific — is the same approach possible on Mac? (I have not worked on Mac so far.) I believe it is OK not to implement this on Mac, from Google's point of view.
2> I am not sure what exception I should raise when the protection-bitmap check fails. My concern is that if I choose an existing exception code (page fault, for example) and later a real page fault happens due to a bug in the code, it could be misinterpreted as our RAM protection fault. And I do not know whether a user-defined exception code is acceptable.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
My question was probably not clear enough, so you must have mistaken it for something else - but thanks to that, I get to see this very interesting idea in your answer :)
I totally understand that Google's priority is to bring on-demand snapshot loading to Windows, so it's fine to leave out Mac for the QEMU (Android Emulator) side patch. But I still hope the new API we add this time works on both Windows and Mac, with the same behavior, as all the existing HAXM APIs do. So I agree with you that any Windows-specific API design should be avoided.
Back to my original question: I know this new `fault_gfn` parameter is a result of the call to `gpa_space_chunk_protected()`. My point is, if we don't worry about chunks and just stick to processing (filling) one page per exit to QEMU (via `HAX_EXIT_PAGEFAULT`), the page-fault GPA we return to QEMU will be the same as `gpa`, so there's no need to call `gpa_space_chunk_protected()` just because it might return a different GPA.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
By the way, I've thought about handling HAXM's own accesses to guest RAM, and your "intrusive" approach makes more sense to me. But I also came to realize how complicated the problem is - for example, since it's possible for HAXM to access a protected GPA in the middle of its MMIO or PIO handler (instruction emulation) code, we have to make sure the code before the GPA access does nothing "irreversible", because as soon as we realize the GPA is protected, we'll abort the handler and return to QEMU with the new exit reason (instead of
HAX_EXIT_FAST_MMIO
orHAX_EXIT_IO
), and must be able to emulate the same MMIO/PIO instruction again when QEMU re-executes it.